-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcreate_zones_and_tiles.py
542 lines (445 loc) · 18 KB
/
create_zones_and_tiles.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
#!/usr/bin/env python3
"""
Pokemon Map Data Restructuring
This script creates a more structured database schema with tiles table,
and extracts 16x16 pixel tile images from the existing tilesets.
The script:
1. Creates a "tiles" table with x, y coordinates, map_id, and tile_image_id
2. Extracts 16x16 pixel tile images from the existing tilesets
Usage:
python create_zones_and_tiles.py
"""
import os
import sqlite3
import binascii
from PIL import Image
from pathlib import Path
import sys
import time
import hashlib
import io
import re
# Constants
# Get the project root directory (parent of the script's directory)
PROJECT_ROOT = Path(__file__).resolve().parent.parent
DB_PATH = PROJECT_ROOT / "pokemon.db"
TILE_IMAGES_DIR = "tile_images"
BATCH_SIZE = 1000 # Number of tiles to insert in a single batch
def create_new_tables():
"""Create new tiles and tile_images tables in the database"""
conn = sqlite3.connect(DB_PATH)
cursor = conn.cursor()
# Drop existing tables if they exist
cursor.execute("DROP TABLE IF EXISTS tiles")
cursor.execute("DROP TABLE IF EXISTS tile_images")
# Create tiles table
cursor.execute(
"""
CREATE TABLE IF NOT EXISTS tiles (
id INTEGER PRIMARY KEY AUTOINCREMENT,
x INTEGER NOT NULL,
y INTEGER NOT NULL,
local_x INTEGER NOT NULL,
local_y INTEGER NOT NULL,
map_id INTEGER NOT NULL,
tile_image_id INTEGER NOT NULL,
is_overworld INTEGER NOT NULL DEFAULT 0,
FOREIGN KEY (map_id) REFERENCES maps (id),
FOREIGN KEY (tile_image_id) REFERENCES tile_images (id)
)
"""
)
# Create tile_images table with image_hash for deduplication
cursor.execute(
"""
CREATE TABLE IF NOT EXISTS tile_images (
id INTEGER PRIMARY KEY AUTOINCREMENT,
tileset_id INTEGER NOT NULL,
block_index INTEGER NOT NULL,
position INTEGER NOT NULL, -- 0: top-left, 1: top-right, 2: bottom-left, 3: bottom-right
image_path TEXT NOT NULL,
image_hash TEXT NOT NULL,
FOREIGN KEY (tileset_id) REFERENCES tilesets (id)
)
"""
)
# Create indexes for better performance
cursor.execute("CREATE INDEX IF NOT EXISTS idx_tiles_map_id ON tiles (map_id)")
cursor.execute(
"CREATE INDEX IF NOT EXISTS idx_tiles_tile_image_id ON tiles (tile_image_id)"
)
cursor.execute(
"CREATE INDEX IF NOT EXISTS idx_tile_images_tileset_id ON tile_images (tileset_id)"
)
cursor.execute(
"CREATE INDEX IF NOT EXISTS idx_tile_images_hash ON tile_images (image_hash)"
)
conn.commit()
return conn
def decode_2bpp_tile(tile_data):
"""Decode a 2bpp tile into a 2D array of pixel values (0-3)
Each tile is 8x8 pixels, with 2 bits per pixel.
Pixels are spread across neighboring bytes.
"""
pixels = []
# Process 16 bytes (8 rows of 2 bytes each)
for row in range(8):
row_pixels = []
# Each row is represented by 2 bytes
byte1 = tile_data[row * 2]
byte2 = tile_data[row * 2 + 1]
# Process each bit in the bytes
for bit in range(8):
# Extract the bit from each byte (from MSB to LSB)
bit_pos = 7 - bit
bit1 = (byte1 >> bit_pos) & 1
bit2 = (byte2 >> bit_pos) & 1
# Combine the bits to get the pixel value (0-3)
pixel_value = (bit2 << 1) | bit1
row_pixels.append(pixel_value)
pixels.append(row_pixels)
return pixels
def get_image_hash(img):
"""Generate a hash for an image to identify duplicates"""
img_bytes = io.BytesIO()
img.save(img_bytes, format="PNG")
return hashlib.md5(img_bytes.getvalue()).hexdigest()
def extract_tile_images(conn):
"""Extract 16x16 pixel tile images from the blocksets and tilesets"""
cursor = conn.cursor()
# Create directory for tile images if it doesn't exist
os.makedirs(TILE_IMAGES_DIR, exist_ok=True)
# Clean up old files
print("Cleaning up old tile images...")
old_files = list(Path(TILE_IMAGES_DIR).glob("*.png"))
for old_file in old_files:
try:
os.remove(old_file)
except Exception as e:
print(f"Error removing {old_file}: {e}")
print(f"Removed {len(old_files)} old tile images")
# Define GameBoy color palette (white, light gray, dark gray, black)
palette = [(255, 255, 255), (192, 192, 192), (96, 96, 96), (0, 0, 0)]
# Get all tilesets
cursor.execute("SELECT id, name FROM tilesets")
tilesets = cursor.fetchall()
tile_image_count = 0
unique_image_count = 0
duplicate_count = 0
total_tilesets = len(tilesets)
print(f"Processing {total_tilesets} tilesets...")
start_time = time.time()
# Dictionary to track image hashes and their corresponding IDs
image_hash_to_id = {}
# Dictionary to map (tileset_id, block_index, position) to tile_image_id
block_pos_to_image_id = {}
for i, (tileset_id, tileset_name) in enumerate(tilesets, 1):
# Update progress
sys.stdout.write(f"\rProcessing tileset {i}/{total_tilesets}: {tileset_name}")
sys.stdout.flush()
# Special case: Map DOJO (tileset ID 5) to GYM (tileset ID 7)
# This is because in the original game, DOJO uses the same graphics as GYM
query_tileset_id = 7 if tileset_id == 5 else tileset_id
# Special case: Map MART (tileset ID 2) to POKECENTER (tileset ID 6)
# This is because marts and pokecenters share similar interior graphics
if tileset_id == 2:
query_tileset_id = 6
# Get blockset data for this tileset
cursor.execute(
"""
SELECT block_index, block_data
FROM blocksets
WHERE tileset_id = ?
ORDER BY block_index
""",
(query_tileset_id,),
)
blockset_rows = cursor.fetchall()
if not blockset_rows:
continue
# Get tileset tiles
cursor.execute(
"""
SELECT tile_index, tile_data
FROM tileset_tiles
WHERE tileset_id = ?
ORDER BY tile_index
""",
(query_tileset_id,),
)
tile_rows = cursor.fetchall()
if not tile_rows:
continue
# Create dictionaries for easy lookup
blocks = {row[0]: row[1] for row in blockset_rows}
tiles = {row[0]: row[1] for row in tile_rows}
# Process each block to create 16x16 pixel images (4 per block)
for block_index, block_data in blocks.items():
# Define the 4 positions in the block (each position is 2x2 tiles)
positions = [
# Top-left: tiles at positions 0,1,4,5
[(0, 0), (0, 1), (1, 0), (1, 1)],
# Top-right: tiles at positions 2,3,6,7
[(0, 2), (0, 3), (1, 2), (1, 3)],
# Bottom-left: tiles at positions 8,9,12,13
[(2, 0), (2, 1), (3, 0), (3, 1)],
# Bottom-right: tiles at positions 10,11,14,15
[(2, 2), (2, 3), (3, 2), (3, 3)],
]
for pos_index, position in enumerate(positions):
# Create a new 16x16 image
img = Image.new("RGB", (16, 16), color=(255, 255, 255))
# Process each of the 4 tiles in this position
for i, (y, x) in enumerate(position):
# Calculate the position in the block data
tile_pos = y * 4 + x
# Get the tile index from the block data
if tile_pos < len(block_data):
tile_index = block_data[tile_pos]
else:
continue
# Get the tile data
tile_data = tiles.get(tile_index)
if not tile_data:
continue
# Decode the tile data
tile_pixels = decode_2bpp_tile(tile_data)
# Calculate where to place this tile in the 16x16 image
offset_x = (i % 2) * 8 # 0 for left tiles, 8 for right tiles
offset_y = (i // 2) * 8 # 0 for top tiles, 8 for bottom tiles
# Draw the tile
for py in range(8):
for px in range(8):
pixel_value = tile_pixels[py][px]
pixel_color = palette[pixel_value]
img.putpixel((offset_x + px, offset_y + py), pixel_color)
# Generate hash for the image
img_hash = get_image_hash(img)
# Check if we've already seen this image
if img_hash in image_hash_to_id:
# Use the existing image ID
existing_image_id = image_hash_to_id[img_hash]
block_pos_to_image_id[(tileset_id, block_index, pos_index)] = (
existing_image_id
)
# Special case: If this is the GYM tileset (ID 7), also store the mapping for DOJO (ID 5)
if tileset_id == 7:
block_pos_to_image_id[(5, block_index, pos_index)] = (
existing_image_id
)
# Special case: If this is the POKECENTER tileset (ID 6), also store the mapping for MART (ID 2)
if tileset_id == 6:
block_pos_to_image_id[(2, block_index, pos_index)] = (
existing_image_id
)
duplicate_count += 1
else:
# Save the image with a sequential number
image_path = f"{TILE_IMAGES_DIR}/tile_{unique_image_count}.png"
img.save(image_path)
# Insert the new image record
cursor.execute(
"""
INSERT INTO tile_images (tileset_id, block_index, position, image_path, image_hash)
VALUES (?, ?, ?, ?, ?)
""",
(tileset_id, block_index, pos_index, image_path, img_hash),
)
# Get the new image ID
image_id = cursor.lastrowid
image_hash_to_id[img_hash] = image_id
block_pos_to_image_id[(tileset_id, block_index, pos_index)] = (
image_id
)
# Special case: If this is the GYM tileset (ID 7), also store the mapping for DOJO (ID 5)
if tileset_id == 7:
block_pos_to_image_id[(5, block_index, pos_index)] = image_id
# Special case: If this is the POKECENTER tileset (ID 6), also store the mapping for MART (ID 2)
if tileset_id == 6:
block_pos_to_image_id[(2, block_index, pos_index)] = image_id
unique_image_count += 1
tile_image_count += 1
# Commit periodically
if unique_image_count % BATCH_SIZE == 0:
conn.commit()
conn.commit()
elapsed_time = time.time() - start_time
print(f"\nProcessed {tile_image_count} tile images")
print(f"- Unique images: {unique_image_count}")
print(f"- Duplicate images: {duplicate_count}")
print(f"- Total time: {elapsed_time:.2f} seconds")
return block_pos_to_image_id
def populate_tiles(conn, block_pos_to_image_id):
"""Populate the tiles table based on the tiles_raw and maps tables"""
cursor = conn.cursor()
# Clear the tiles table before repopulating
print("Clearing existing tiles...")
cursor.execute("DELETE FROM tiles")
conn.commit()
# Check if the tiles_raw table exists
cursor.execute(
"SELECT name FROM sqlite_master WHERE type='table' AND name='tiles_raw'"
)
has_tiles_raw = cursor.fetchone() is not None
if not has_tiles_raw:
print("Error: tiles_raw table does not exist. Please run export_map.py first.")
return
# Get all maps with their is_overworld flag
cursor.execute(
"""
SELECT id, name, width, height, tileset_id, is_overworld
FROM maps
"""
)
maps = cursor.fetchall()
total_maps = len(maps)
print(f"Processing {total_maps} maps...")
tile_count = 0
processed_maps = 0
skipped_maps = 0
skipped_map_names = []
start_time = time.time()
# Prepare for batch insert
tiles_data = []
# Get the overworld map positions if available
cursor.execute(
"SELECT name FROM sqlite_master WHERE type='table' AND name='overworld_map_positions'"
)
has_positions_table = cursor.fetchone() is not None
map_positions = {}
if has_positions_table:
cursor.execute(
"SELECT map_name, x_offset, y_offset FROM overworld_map_positions"
)
for map_name, x_offset, y_offset in cursor.fetchall():
map_positions[map_name] = (x_offset, y_offset)
# Process each map
for i, (
map_id,
map_name,
width,
height,
tileset_id,
is_overworld,
) in enumerate(maps, 1):
# Update progress every 5 maps
if i % 5 == 0 or i == total_maps:
sys.stdout.write(
f"\rProcessed {i}/{total_maps} maps, created {tile_count} tiles"
)
sys.stdout.flush()
processed_maps += 1
# Get position offsets for this map if it's an overworld map
x_offset, y_offset = 0, 0
if is_overworld and map_name in map_positions:
x_offset, y_offset = map_positions[map_name]
# Get raw tile data for this map from tiles_raw table
cursor.execute(
"""
SELECT x, y, block_index, tileset_id, is_overworld
FROM tiles_raw
WHERE map_id = ?
""",
(map_id,),
)
raw_tiles = cursor.fetchall()
if not raw_tiles:
continue
# Collect tiles for this map
map_tiles = []
# Process each raw tile
for raw_x, raw_y, block_index, raw_tileset_id, raw_is_overworld in raw_tiles:
# Special case: Map DOJO (tileset ID 5) to GYM (tileset ID 7)
# This is because in the original game, DOJO uses the same graphics as GYM
lookup_tileset_id = 7 if raw_tileset_id == 5 else raw_tileset_id
# Special case: Map MART (tileset ID 2) to POKECENTER (tileset ID 6)
# This is because marts and pokecenters share similar interior graphics
if raw_tileset_id == 2:
lookup_tileset_id = 6
# Each block corresponds to 4 tiles (2x2 grid)
# We need to create 4 entries in the tiles table
for position in range(4):
# Calculate the actual x, y coordinates for this tile
# Each block is 2x2 tiles, so we need to multiply by 2
tile_x = raw_x * 2 + (position % 2) + x_offset
tile_y = raw_y * 2 + (position // 2)
# Add y_offset if applicable (for maps with position data)
if map_name in map_positions:
tile_y += y_offset
# Get the tile_image_id from our dictionary
tile_image_id = block_pos_to_image_id.get(
(lookup_tileset_id, block_index, position)
)
if not tile_image_id:
# Try with a default position if specific position not found
tile_image_id = block_pos_to_image_id.get(
(lookup_tileset_id, block_index, 0)
)
if not tile_image_id:
continue
# Add to map tiles
map_tiles.append(
(
tile_x,
tile_y,
tile_x,
tile_y,
map_id,
tile_image_id,
is_overworld,
)
)
# Sort map tiles by y-coordinate in descending order (top to bottom becomes bottom to top)
map_tiles.sort(key=lambda t: (-t[1], t[0]))
# Add to batch insert data
tiles_data.extend(map_tiles)
tile_count += len(map_tiles)
# Execute batch insert if we've reached the batch size
if len(tiles_data) >= BATCH_SIZE:
cursor.executemany(
"""
INSERT INTO tiles (x, y, local_x, local_y, map_id, tile_image_id, is_overworld)
VALUES (?, ?, ?, ?, ?, ?, ?)
""",
tiles_data,
)
conn.commit()
tiles_data = []
# Insert any remaining tiles
if tiles_data:
cursor.executemany(
"""
INSERT INTO tiles (x, y, local_x, local_y, map_id, tile_image_id, is_overworld)
VALUES (?, ?, ?, ?, ?, ?, ?)
""",
tiles_data,
)
conn.commit()
elapsed_time = time.time() - start_time
print(
f"\nCreated {tile_count} tiles from {processed_maps} maps in {elapsed_time:.2f} seconds"
)
def main():
"""Main function"""
total_start_time = time.time()
print("Creating new tables...")
conn = create_new_tables()
print("\nExtracting tile images...")
block_pos_to_image_id = extract_tile_images(conn)
print("\nPopulating tiles table...")
populate_tiles(conn, block_pos_to_image_id)
# Print summary
cursor = conn.cursor()
cursor.execute("SELECT COUNT(*) FROM tile_images")
tile_image_count = cursor.fetchone()[0]
cursor.execute("SELECT COUNT(*) FROM tiles")
tile_count = cursor.fetchone()[0]
total_elapsed_time = time.time() - total_start_time
print("\nSummary:")
print(f"- Extracted {tile_image_count} unique tile images")
print(f"- Created {tile_count} tiles")
print(f"- Total time: {total_elapsed_time:.2f} seconds")
print("\nDone!")
conn.close()
if __name__ == "__main__":
main()