2016-08-12 18:34:11 -07:00
""" Extract all the juicy details from a Gen I game.
This was a pain in the ass ! Thank you SO MUCH to :
pokered
pokeyellow
vixie
http : / / www . pastraiser . com / cpu / gameboy / gameboy_opcodes . html
"""
# TODO fix that docstring
# TODO note terminology somewhere: id, index, identifier
2016-09-10 18:05:41 -07:00
from collections import defaultdict
2016-08-12 18:34:11 -07:00
from collections import OrderedDict
import hashlib
import io
import logging
from pathlib import Path
import sys
2016-08-14 00:15:30 -07:00
from camel import Camel
2016-08-12 18:34:11 -07:00
from classtools import reify
from construct import *
2016-08-21 16:44:07 -07:00
from pokedex . extract . lib . gbz80 import find_code
2016-08-12 18:34:11 -07:00
import pokedex . schema as schema
2016-09-10 21:23:57 -07:00
# TODO set this up to colorcode, probably put that... elsewhere
2016-08-12 18:34:11 -07:00
log = logging . getLogger ( __name__ )
# Known official games, the languages they were released in, and hashes of
# their contents
GAME_RELEASE_MD5SUMS = {
# Set 0: Original Red/Green, only released in Japan
' jp-red ' : {
' ja ' : [
' 912d4f77d118390a2e2c42b2016a19d4 ' , # original
' 4c44844f8d5aa3305a0cf2c95cf96333 ' , # revision A
] ,
} ,
' jp-green ' : {
' ja ' : [
' e30ffbab1f239f09b226477d84db1368 ' , # original
' 16ddd8897092936fbc0e286c6a6b23a2 ' , # revision A
] ,
} ,
# Set 1: Blue in Japan, split into Red and Blue worldwide
' jp-blue ' : {
' ja ' : [ ' c1adf0a77809ac91d905a4828888a2f0 ' ] ,
} ,
' ww-red ' : {
' de ' : [ ' 8ed0e8d45a81ca34de625d930148a512 ' ] ,
' en ' : [ ' 3d45c1ee9abd5738df46d2bdda8b57dc ' ] ,
' es ' : [ ' 463c241c8721ab1d1da17c91de9f8a32 ' ] ,
' fr ' : [ ' 669700657cb06ed09371cdbdef69e8a3 ' ] ,
' it ' : [ ' 6468fb0652dde30eb968a44f17c686f1 ' ] ,
} ,
' ww-blue ' : {
' de ' : [ ' a1ec7f07c7b4251d5fafc50622d546f8 ' ] ,
' en ' : [ ' 50927e843568814f7ed45ec4f944bd8b ' ] ,
' es ' : [ ' 6e7663f908334724548a66fc9c386002 ' ] ,
' fr ' : [ ' 35c8154c81abb2ab850689fd28a03515 ' ] ,
' it ' : [ ' ebe0742b472b3e80a9c6749f06181073 ' ] ,
} ,
# Set 2: Yellow, pretty much the same everywhere
# TODO is that true?
# TODO missing other languages
' yellow ' : {
' en ' : [ ' d9290db87b1f0a23b89f99ee4469e34b ' ] ,
' ja ' : [
' aa13e886a47fd473da63b7d5ddf2828d ' , # original
' 96c1f411671b6e1761cf31884dde0dbb ' , # revision A
' 5d9c071cf6eb5f3a697bbcd9311b4d04 ' , # revision B
] ,
}
}
# Same, but rearranged to md5 => (game, language)
GAME_RELEASE_MD5SUM_INDEX = {
md5sum : ( game , language )
for ( game , language_sums ) in GAME_RELEASE_MD5SUMS . items ( )
for ( language , md5sums ) in language_sums . items ( )
for md5sum in md5sums
}
# ------------------------------------------------------------------------------
# Game structure stuff
#
# A lot of this was made much, much easier by the work done on pokered:
# https://github.com/pret/pokered
# Thank y'all so much!
# TODO possibly some of this should be in a shared place, not this file
GROWTH_RATES = {
2016-08-14 00:15:30 -07:00
0 : ' growth-rate.medium ' ,
3 : ' growth-rate.medium-slow ' ,
4 : ' growth-rate.fast ' ,
5 : ' growth-rate.slow ' ,
2016-08-12 18:34:11 -07:00
}
EVOLUTION_TRIGGERS = {
2016-08-14 00:15:30 -07:00
1 : ' evolution-trigger.level-up ' ,
2 : ' evolution-trigger.use-item ' ,
3 : ' evolution-trigger.trade ' ,
2016-08-12 18:34:11 -07:00
}
# TODO these are loci, not enums, so hardcoding all their identifiers here
# makes me nonspecifically uncomfortable
POKEMON_IDENTIFIERS = {
2016-08-14 00:15:30 -07:00
1 : ' pokemon.bulbasaur ' ,
2 : ' pokemon.ivysaur ' ,
3 : ' pokemon.venusaur ' ,
4 : ' pokemon.charmander ' ,
5 : ' pokemon.charmeleon ' ,
6 : ' pokemon.charizard ' ,
7 : ' pokemon.squirtle ' ,
8 : ' pokemon.wartortle ' ,
9 : ' pokemon.blastoise ' ,
10 : ' pokemon.caterpie ' ,
11 : ' pokemon.metapod ' ,
12 : ' pokemon.butterfree ' ,
13 : ' pokemon.weedle ' ,
14 : ' pokemon.kakuna ' ,
15 : ' pokemon.beedrill ' ,
16 : ' pokemon.pidgey ' ,
17 : ' pokemon.pidgeotto ' ,
18 : ' pokemon.pidgeot ' ,
19 : ' pokemon.rattata ' ,
20 : ' pokemon.raticate ' ,
21 : ' pokemon.spearow ' ,
22 : ' pokemon.fearow ' ,
23 : ' pokemon.ekans ' ,
24 : ' pokemon.arbok ' ,
25 : ' pokemon.pikachu ' ,
26 : ' pokemon.raichu ' ,
27 : ' pokemon.sandshrew ' ,
28 : ' pokemon.sandslash ' ,
29 : ' pokemon.nidoran-f ' ,
30 : ' pokemon.nidorina ' ,
31 : ' pokemon.nidoqueen ' ,
32 : ' pokemon.nidoran-m ' ,
33 : ' pokemon.nidorino ' ,
34 : ' pokemon.nidoking ' ,
35 : ' pokemon.clefairy ' ,
36 : ' pokemon.clefable ' ,
37 : ' pokemon.vulpix ' ,
38 : ' pokemon.ninetales ' ,
39 : ' pokemon.jigglypuff ' ,
40 : ' pokemon.wigglytuff ' ,
41 : ' pokemon.zubat ' ,
42 : ' pokemon.golbat ' ,
43 : ' pokemon.oddish ' ,
44 : ' pokemon.gloom ' ,
45 : ' pokemon.vileplume ' ,
46 : ' pokemon.paras ' ,
47 : ' pokemon.parasect ' ,
48 : ' pokemon.venonat ' ,
49 : ' pokemon.venomoth ' ,
50 : ' pokemon.diglett ' ,
51 : ' pokemon.dugtrio ' ,
52 : ' pokemon.meowth ' ,
53 : ' pokemon.persian ' ,
54 : ' pokemon.psyduck ' ,
55 : ' pokemon.golduck ' ,
56 : ' pokemon.mankey ' ,
57 : ' pokemon.primeape ' ,
58 : ' pokemon.growlithe ' ,
59 : ' pokemon.arcanine ' ,
60 : ' pokemon.poliwag ' ,
61 : ' pokemon.poliwhirl ' ,
62 : ' pokemon.poliwrath ' ,
63 : ' pokemon.abra ' ,
64 : ' pokemon.kadabra ' ,
65 : ' pokemon.alakazam ' ,
66 : ' pokemon.machop ' ,
67 : ' pokemon.machoke ' ,
68 : ' pokemon.machamp ' ,
69 : ' pokemon.bellsprout ' ,
70 : ' pokemon.weepinbell ' ,
71 : ' pokemon.victreebel ' ,
72 : ' pokemon.tentacool ' ,
73 : ' pokemon.tentacruel ' ,
74 : ' pokemon.geodude ' ,
75 : ' pokemon.graveler ' ,
76 : ' pokemon.golem ' ,
77 : ' pokemon.ponyta ' ,
78 : ' pokemon.rapidash ' ,
79 : ' pokemon.slowpoke ' ,
80 : ' pokemon.slowbro ' ,
81 : ' pokemon.magnemite ' ,
82 : ' pokemon.magneton ' ,
83 : ' pokemon.farfetchd ' ,
84 : ' pokemon.doduo ' ,
85 : ' pokemon.dodrio ' ,
86 : ' pokemon.seel ' ,
87 : ' pokemon.dewgong ' ,
88 : ' pokemon.grimer ' ,
89 : ' pokemon.muk ' ,
90 : ' pokemon.shellder ' ,
91 : ' pokemon.cloyster ' ,
92 : ' pokemon.gastly ' ,
93 : ' pokemon.haunter ' ,
94 : ' pokemon.gengar ' ,
95 : ' pokemon.onix ' ,
96 : ' pokemon.drowzee ' ,
97 : ' pokemon.hypno ' ,
98 : ' pokemon.krabby ' ,
99 : ' pokemon.kingler ' ,
100 : ' pokemon.voltorb ' ,
101 : ' pokemon.electrode ' ,
102 : ' pokemon.exeggcute ' ,
103 : ' pokemon.exeggutor ' ,
104 : ' pokemon.cubone ' ,
105 : ' pokemon.marowak ' ,
106 : ' pokemon.hitmonlee ' ,
107 : ' pokemon.hitmonchan ' ,
108 : ' pokemon.lickitung ' ,
109 : ' pokemon.koffing ' ,
110 : ' pokemon.weezing ' ,
111 : ' pokemon.rhyhorn ' ,
112 : ' pokemon.rhydon ' ,
113 : ' pokemon.chansey ' ,
114 : ' pokemon.tangela ' ,
115 : ' pokemon.kangaskhan ' ,
116 : ' pokemon.horsea ' ,
117 : ' pokemon.seadra ' ,
118 : ' pokemon.goldeen ' ,
119 : ' pokemon.seaking ' ,
120 : ' pokemon.staryu ' ,
121 : ' pokemon.starmie ' ,
122 : ' pokemon.mr-mime ' ,
123 : ' pokemon.scyther ' ,
124 : ' pokemon.jynx ' ,
125 : ' pokemon.electabuzz ' ,
126 : ' pokemon.magmar ' ,
127 : ' pokemon.pinsir ' ,
128 : ' pokemon.tauros ' ,
129 : ' pokemon.magikarp ' ,
130 : ' pokemon.gyarados ' ,
131 : ' pokemon.lapras ' ,
132 : ' pokemon.ditto ' ,
133 : ' pokemon.eevee ' ,
134 : ' pokemon.vaporeon ' ,
135 : ' pokemon.jolteon ' ,
136 : ' pokemon.flareon ' ,
137 : ' pokemon.porygon ' ,
138 : ' pokemon.omanyte ' ,
139 : ' pokemon.omastar ' ,
140 : ' pokemon.kabuto ' ,
141 : ' pokemon.kabutops ' ,
142 : ' pokemon.aerodactyl ' ,
143 : ' pokemon.snorlax ' ,
144 : ' pokemon.articuno ' ,
145 : ' pokemon.zapdos ' ,
146 : ' pokemon.moltres ' ,
147 : ' pokemon.dratini ' ,
148 : ' pokemon.dragonair ' ,
149 : ' pokemon.dragonite ' ,
150 : ' pokemon.mewtwo ' ,
151 : ' pokemon.mew ' ,
2016-08-12 18:34:11 -07:00
}
TYPE_IDENTIFIERS = {
2016-08-14 00:15:30 -07:00
0 : ' type.normal ' ,
1 : ' type.fighting ' ,
2 : ' type.flying ' ,
3 : ' type.poison ' ,
4 : ' type.ground ' ,
5 : ' type.rock ' ,
#6: 'type.bird',
7 : ' type.bug ' ,
8 : ' type.ghost ' ,
9 : ' type.steel ' ,
20 : ' type.fire ' ,
21 : ' type.water ' ,
22 : ' type.grass ' ,
23 : ' type.electric ' ,
24 : ' type.psychic ' ,
25 : ' type.ice ' ,
26 : ' type.dragon ' ,
27 : ' type.dark ' ,
2016-08-12 18:34:11 -07:00
}
MOVE_IDENTIFIERS = {
# TODO stupid hack for initial moveset
0 : ' -- ' ,
2016-08-14 00:15:30 -07:00
1 : ' move.pound ' ,
2 : ' move.karate-chop ' ,
3 : ' move.double-slap ' ,
4 : ' move.comet-punch ' ,
5 : ' move.mega-punch ' ,
6 : ' move.pay-day ' ,
7 : ' move.fire-punch ' ,
8 : ' move.ice-punch ' ,
9 : ' move.thunder-punch ' ,
10 : ' move.scratch ' ,
11 : ' move.vice-grip ' ,
12 : ' move.guillotine ' ,
13 : ' move.razor-wind ' ,
14 : ' move.swords-dance ' ,
15 : ' move.cut ' ,
16 : ' move.gust ' ,
17 : ' move.wing-attack ' ,
18 : ' move.whirlwind ' ,
19 : ' move.fly ' ,
20 : ' move.bind ' ,
21 : ' move.slam ' ,
22 : ' move.vine-whip ' ,
23 : ' move.stomp ' ,
24 : ' move.double-kick ' ,
25 : ' move.mega-kick ' ,
26 : ' move.jump-kick ' ,
27 : ' move.rolling-kick ' ,
28 : ' move.sand-attack ' ,
29 : ' move.headbutt ' ,
30 : ' move.horn-attack ' ,
31 : ' move.fury-attack ' ,
32 : ' move.horn-drill ' ,
33 : ' move.tackle ' ,
34 : ' move.body-slam ' ,
35 : ' move.wrap ' ,
36 : ' move.take-down ' ,
37 : ' move.thrash ' ,
38 : ' move.double-edge ' ,
39 : ' move.tail-whip ' ,
40 : ' move.poison-sting ' ,
41 : ' move.twineedle ' ,
42 : ' move.pin-missile ' ,
43 : ' move.leer ' ,
44 : ' move.bite ' ,
45 : ' move.growl ' ,
46 : ' move.roar ' ,
47 : ' move.sing ' ,
48 : ' move.supersonic ' ,
49 : ' move.sonic-boom ' ,
50 : ' move.disable ' ,
51 : ' move.acid ' ,
52 : ' move.ember ' ,
53 : ' move.flamethrower ' ,
54 : ' move.mist ' ,
55 : ' move.water-gun ' ,
56 : ' move.hydro-pump ' ,
57 : ' move.surf ' ,
58 : ' move.ice-beam ' ,
59 : ' move.blizzard ' ,
60 : ' move.psybeam ' ,
61 : ' move.bubble-beam ' ,
62 : ' move.aurora-beam ' ,
63 : ' move.hyper-beam ' ,
64 : ' move.peck ' ,
65 : ' move.drill-peck ' ,
66 : ' move.submission ' ,
67 : ' move.low-kick ' ,
68 : ' move.counter ' ,
69 : ' move.seismic-toss ' ,
70 : ' move.strength ' ,
71 : ' move.absorb ' ,
72 : ' move.mega-drain ' ,
73 : ' move.leech-seed ' ,
74 : ' move.growth ' ,
75 : ' move.razor-leaf ' ,
76 : ' move.solar-beam ' ,
77 : ' move.poison-powder ' ,
78 : ' move.stun-spore ' ,
79 : ' move.sleep-powder ' ,
80 : ' move.petal-dance ' ,
81 : ' move.string-shot ' ,
82 : ' move.dragon-rage ' ,
83 : ' move.fire-spin ' ,
84 : ' move.thunder-shock ' ,
85 : ' move.thunderbolt ' ,
86 : ' move.thunder-wave ' ,
87 : ' move.thunder ' ,
88 : ' move.rock-throw ' ,
89 : ' move.earthquake ' ,
90 : ' move.fissure ' ,
91 : ' move.dig ' ,
92 : ' move.toxic ' ,
93 : ' move.confusion ' ,
94 : ' move.psychic ' ,
95 : ' move.hypnosis ' ,
96 : ' move.meditate ' ,
97 : ' move.agility ' ,
98 : ' move.quick-attack ' ,
99 : ' move.rage ' ,
100 : ' move.teleport ' ,
101 : ' move.night-shade ' ,
102 : ' move.mimic ' ,
103 : ' move.screech ' ,
104 : ' move.double-team ' ,
105 : ' move.recover ' ,
106 : ' move.harden ' ,
107 : ' move.minimize ' ,
108 : ' move.smokescreen ' ,
109 : ' move.confuse-ray ' ,
110 : ' move.withdraw ' ,
111 : ' move.defense-curl ' ,
112 : ' move.barrier ' ,
113 : ' move.light-screen ' ,
114 : ' move.haze ' ,
115 : ' move.reflect ' ,
116 : ' move.focus-energy ' ,
117 : ' move.bide ' ,
118 : ' move.metronome ' ,
119 : ' move.mirror-move ' ,
120 : ' move.self-destruct ' ,
121 : ' move.egg-bomb ' ,
122 : ' move.lick ' ,
123 : ' move.smog ' ,
124 : ' move.sludge ' ,
125 : ' move.bone-club ' ,
126 : ' move.fire-blast ' ,
127 : ' move.waterfall ' ,
128 : ' move.clamp ' ,
129 : ' move.swift ' ,
130 : ' move.skull-bash ' ,
131 : ' move.spike-cannon ' ,
132 : ' move.constrict ' ,
133 : ' move.amnesia ' ,
134 : ' move.kinesis ' ,
135 : ' move.soft-boiled ' ,
136 : ' move.high-jump-kick ' ,
137 : ' move.glare ' ,
138 : ' move.dream-eater ' ,
139 : ' move.poison-gas ' ,
140 : ' move.barrage ' ,
141 : ' move.leech-life ' ,
142 : ' move.lovely-kiss ' ,
143 : ' move.sky-attack ' ,
144 : ' move.transform ' ,
145 : ' move.bubble ' ,
146 : ' move.dizzy-punch ' ,
147 : ' move.spore ' ,
148 : ' move.flash ' ,
149 : ' move.psywave ' ,
150 : ' move.splash ' ,
151 : ' move.acid-armor ' ,
152 : ' move.crabhammer ' ,
153 : ' move.explosion ' ,
154 : ' move.fury-swipes ' ,
155 : ' move.bonemerang ' ,
156 : ' move.rest ' ,
157 : ' move.rock-slide ' ,
158 : ' move.hyper-fang ' ,
159 : ' move.sharpen ' ,
160 : ' move.conversion ' ,
161 : ' move.tri-attack ' ,
162 : ' move.super-fang ' ,
163 : ' move.slash ' ,
164 : ' move.substitute ' ,
165 : ' move.struggle ' ,
2016-08-12 18:34:11 -07:00
}
def unbank ( * args ) :
""" Convert a " bank " identifier, XX:YYYY, to a real address. The Game Boy
is all about banks internally , and it ' s what pokered uses, so I ' ve kept
them intact in this file .
The scheme is fairly simple :
- XX is the bank ; YYYY is an address . Banks are 0x4000 bytes .
- For bank 00 , YYYY is already a real address , and should be between 0x0000
and 0x4000 .
- For any other bank , YYYY is between 0x4000 and 0x8000 , and they ' re just
arranged in order . So for bank 01 , YYYY is already a real address ; for
bank 02 , you add 0x4000 ; and so on .
Accepts either two ints ( XX and YYYY ) or a string in the form ' XX:YYYY ' .
"""
if len ( args ) == 1 :
banked_address , = args
banks , addrs = banked_address . split ( ' : ' )
bank = int ( banks , 16 )
addr = int ( addrs , 16 )
else :
bank , addr = args
if bank :
assert 0x4000 < = addr < 0x8000
return addr + ( bank - 1 ) * 0x4000
else :
assert 0 < = addr < 0x4000
return addr
def bank ( addr ) :
""" Inverse of the above transformation. """
if addr < 0x4000 :
return 0 , addr
bank , addr = divmod ( addr , 0x4000 )
addr + = 0x4000
return bank , addr
2016-09-10 21:23:57 -07:00
JA_CHARMAP = dict ( enumerate ( [
# 0x
# 00 appears at the beginning of a lot of Pokédex entries?
" " , " イ゛ " , " ヴ " , " エ゛ " , " オ゛ " , " ガ " , " ギ " , " グ " ,
" ゲ " , " ゴ " , " ザ " , " ジ " , " ズ " , " ゼ " , " ゾ " , " ダ " ,
# 1x
" ヂ " , " ヅ " , " デ " , " ド " , " ナ゛ " , " ニ゛ " , " ヌ゛ " , " ネ゛ " ,
" ノ゛ " , " バ " , " ビ " , " ブ " , " ボ " , " マ゛ " , " ミ゛ " , " ム゛ " ,
# 2x
" ィ゛ " , " あ゛ " , " い゛ " , " ゔ " , " え゛ " , " お゛ " , " が " , " ぎ " ,
" ぐ " , " げ " , " ご " , " ざ " , " じ " , " ず " , " ぜ " , " ぞ " ,
# 3x
" だ " , " ぢ " , " づ " , " で " , " ど " , " な゛ " , " に゛ " , " ぬ゛ " ,
" ね゛ " , " の゛ " , " ば " , " び " , " ぶ " , " べ " , " ぼ " , " ま゛ " ,
# 4x
# 4F is the Pokédex newline
# 4E is the dialogue newline (puts the cursor on the bottom line)
" パ " , " ピ " , " プ " , " ポ " , " ぱ " , " ぴ " , " ぷ " , " ぺ " ,
" ぽ " , " \f " , " が " , " も゜ " , " <EFBFBD> " , " <EFBFBD> " , " \n " , " \n " ,
# 5x
# 50 is the string terminator, represented by @ in pokered
# 51 prompts for a button press, then clears the screen
# 52 is the player's name
# 53 is the rival's name
# 55 prompts for a button press, then scrolls up one line
# 57 ends dialogue, invisibly
# 58 ends dialogue, visibly
# 59 is the inactive Pokémon in battle
# 5A is the active Pokémon in battle
# 5F marks the end of a Pokédex entry, which automaticaly adds a period
" @ " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " ポケモン " , " <EFBFBD> " , " …… " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " パソコン " , " わざマシン " , " トレーナー " , " ロケットだん " , " 。 " ,
# 6x
" A " , " B " , " C " , " D " , " E " , " F " , " G " , " H " ,
" I " , " V " , " S " , " L " , " M " , " : " , " ぃ " , " ぅ " ,
# 7x
# 79 - 7E are the TL, T/B, TR, L/R, BL, and BR of the text box
" 「 " , " 」 " , " 『 " , " 』 " , " ・ " , " … " , " ぁ " , " ぇ " ,
" ぉ " , " ╔ " , " ═ " , " ╗ " , " ║ " , " ╚ " , " ╝ " , " " ,
# 8x
" ア " , " イ " , " ウ " , " エ " , " オ " , " カ " , " キ " , " ク " ,
" ケ " , " コ " , " サ " , " シ " , " ス " , " セ " , " ソ " , " タ " ,
# 9x
" チ " , " ツ " , " テ " , " ト " , " ナ " , " ニ " , " ヌ " , " ネ " ,
" ノ " , " ハ " , " ヒ " , " フ " , " ホ " , " マ " , " ミ " , " ム " ,
# Ax
" メ " , " モ " , " ヤ " , " ユ " , " ヨ " , " ラ " , " ル " , " レ " ,
" ロ " , " ワ " , " ヲ " , " ン " , " ッ " , " ャ " , " ュ " , " ョ " ,
# Bx
" ィ " , " あ " , " い " , " う " , " え " , " お " , " か " , " き " ,
" く " , " け " , " こ " , " さ " , " し " , " す " , " せ " , " そ " ,
# Cx
" た " , " ち " , " つ " , " て " , " と " , " な " , " に " , " ぬ " ,
" ね " , " の " , " は " , " ひ " , " ふ " , " へ " , " ほ " , " ま " ,
# Dx
" み " , " む " , " め " , " も " , " や " , " ゆ " , " よ " , " ら " ,
" り " , " る " , " れ " , " ろ " , " わ " , " を " , " ん " , " っ " ,
# Ex
" ゃ " , " ゅ " , " ょ " , " ー " , " ゜ " , " ゛ " , " ? " , " ! " ,
" 。 " , " ァ " , " ゥ " , " ェ " , " ▷ " , " ▶ " , " ▼ " , " ♂ " ,
# Fx
" 円 " , " × " , " . " , " / " , " ォ " , " ♀ " , " 0 " , " 1 " ,
" 2 " , " 3 " , " 4 " , " 5 " , " 6 " , " 7 " , " 8 " , " 9 " ,
] ) )
2016-08-12 18:34:11 -07:00
2016-09-10 21:23:57 -07:00
EN_CHARMAP = dict ( enumerate ( [
2016-08-12 18:34:11 -07:00
# 0x0X
2016-09-10 21:23:57 -07:00
" " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-08-12 18:34:11 -07:00
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x1X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x2X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x3X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-09-10 21:23:57 -07:00
# 4x
2016-08-12 18:34:11 -07:00
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-09-10 21:23:57 -07:00
" <EFBFBD> " , " \f " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " \n " , " \n " ,
# 5x
" @ " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " POKé " , " <EFBFBD> " , " …… " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " PC " , " TM " , " TRAINER " , " ROCKET " , " . " ,
# 6x
" A " , " B " , " C " , " D " , " E " , " F " , " G " , " H " ,
" I " , " V " , " S " , " L " , " M " , " : " , " ぃ " , " ぅ " ,
# 7x
" ‘ " , " ’ " , " “ " , " ” " , " ・ " , " … " , " ぁ " , " ぇ " ,
" ぉ " , " ╔ " , " ═ " , " ╗ " , " ║ " , " ╚ " , " ╝ " , " " ,
# 8x
" A " , " B " , " C " , " D " , " E " , " F " , " G " , " H " ,
" I " , " J " , " K " , " L " , " M " , " N " , " O " , " P " ,
# 9x
" Q " , " R " , " S " , " T " , " U " , " V " , " W " , " X " ,
" Y " , " Z " , " ( " , " ) " , " : " , " ; " , " [ " , " ] " ,
# Ax
" a " , " b " , " c " , " d " , " e " , " f " , " g " , " h " ,
" i " , " j " , " k " , " l " , " m " , " n " , " o " , " p " ,
# Bx
" q " , " r " , " s " , " t " , " u " , " v " , " w " , " x " ,
" y " , " z " , " é " , " ʼ d" , " ʼ l" , " ʼ s" , " ʼ t" , " ʼ v" ,
# Cx
2016-08-12 18:34:11 -07:00
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-09-10 21:23:57 -07:00
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# Dx
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# Ex
" ' " , " ᴾₖ " , " ᴹₙ " , " - " , " ʼ r" , " ʼ m" , " ? " , " ! " ,
" . " , " ァ " , " ゥ " , " ェ " , " ▷ " , " ▶ " , " ▼ " , " ♂ " ,
# Fx
# F0 is the currency symbol; this is the ruble sign, close enough
" ₽ " , " × " , " . " , " / " , " , " , " ♀ " , " 0 " , " 1 " ,
" 2 " , " 3 " , " 4 " , " 5 " , " 6 " , " 7 " , " 8 " , " 9 " ,
] ) )
# ty, tachyon
DE_FR_CHARMAP = dict ( enumerate ( [
# 0x0X
2016-08-12 18:34:11 -07:00
" " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-09-10 21:23:57 -07:00
# 0x1X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x2X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x3X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 4x
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " \f " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " \n " , " \n " ,
# 5x
" @ " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " POKé " , " <EFBFBD> " , " …… " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-08-12 18:34:11 -07:00
# 0x6X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x7X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " " ,
# 0x8X
" A " , " B " , " C " , " D " , " E " , " F " , " G " , " H " ,
" I " , " J " , " K " , " L " , " M " , " N " , " O " , " P " ,
# 0x9X
" Q " , " R " , " S " , " T " , " U " , " V " , " W " , " X " ,
" Y " , " Z " , " ( " , " ) " , " : " , " ; " , " [ " , " ] " ,
# 0xAX
" a " , " b " , " c " , " d " , " e " , " f " , " g " , " h " ,
" i " , " j " , " k " , " l " , " m " , " n " , " o " , " p " ,
# 0xBX
" q " , " r " , " s " , " t " , " u " , " v " , " w " , " x " ,
" y " , " z " , " à " , " è " , " é " , " ù " , " ß " , " ç " ,
# 0xCX
" Ä " , " Ö " , " Ü " , " ä " , " ö " , " ü " , " ë " , " ï " ,
" â " , " ô " , " û " , " ê " , " î " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0xDX
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " cʼ " , " dʼ " , " jʼ " , " lʼ " ,
" mʼ " , " nʼ " , " pʼ " , " sʼ " , " ʼ s" , " tʼ " , " uʼ " , " yʼ " ,
# 0xEX
2016-09-10 21:23:57 -07:00
" ' " , " ᴾₖ " , " ᴹₙ " , " - " , " ¿ " , " ¡ " , " ? " , " ! " ,
2016-08-12 18:34:11 -07:00
" . " , " ァ " , " ゥ " , " ェ " , " ▹ " , " ▸ " , " ▾ " , " ♂ " ,
# 0xFX
" $ " , " × " , " . " , " / " , " , " , " ♀ " , " 0 " , " 1 " ,
" 2 " , " 3 " , " 4 " , " 5 " , " 6 " , " 7 " , " 8 " , " 9 " ,
] ) )
ES_IT_CHARMAP = dict ( enumerate ( [
# 0x0X
2016-09-10 21:23:57 -07:00
" " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-08-12 18:34:11 -07:00
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x1X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x2X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x3X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-09-10 21:23:57 -07:00
# 4x
2016-08-12 18:34:11 -07:00
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
2016-09-10 21:23:57 -07:00
" <EFBFBD> " , " \f " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " \n " , " \n " ,
# 5x
" @ " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " POKé " , " <EFBFBD> " , " …… " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " . " ,
2016-08-12 18:34:11 -07:00
# 0x6X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
# 0x7X
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " ,
" <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " <EFBFBD> " , " " ,
# 0x8X
" A " , " B " , " C " , " D " , " E " , " F " , " G " , " H " ,
" I " , " J " , " K " , " L " , " M " , " N " , " O " , " P " ,
# 0x9X
" Q " , " R " , " S " , " T " , " U " , " V " , " W " , " X " ,
" Y " , " Z " , " ( " , " ) " , " : " , " ; " , " [ " , " ] " ,
# 0xAX
" a " , " b " , " c " , " d " , " e " , " f " , " g " , " h " ,
" i " , " j " , " k " , " l " , " m " , " n " , " o " , " p " ,
# 0xBX
" q " , " r " , " s " , " t " , " u " , " v " , " w " , " x " ,
" y " , " z " , " à " , " è " , " é " , " ù " , " À " , " Á " ,
# 0xCX
" Ä " , " Ö " , " Ü " , " ä " , " ö " , " ü " , " È " , " É " ,
" Ì " , " Í " , " Ñ " , " Ò " , " Ó " , " Ù " , " Ú " , " á " ,
# 0xDX
" ì " , " í " , " ñ " , " ò " , " ó " , " ú " , " º " , " & " ,
" ʼ d" , " ʼ l" , " ʼ m" , " ʼ r" , " ʼ s" , " ʼ t" , " ʼ v" , " " ,
# 0xEX
2016-09-10 21:23:57 -07:00
" ' " , " ᴾₖ " , " ᴹₙ " , " - " , " ¿ " , " ¡ " , " ? " , " ! " ,
2016-08-12 18:34:11 -07:00
" . " , " ァ " , " ゥ " , " ェ " , " ▹ " , " ▸ " , " ▾ " , " ♂ " ,
# 0xFX
" $ " , " × " , " . " , " / " , " , " , " ♀ " , " 0 " , " 1 " ,
2016-09-10 21:23:57 -07:00
" 2 " , " 3 " , " 4 " , " 5 " , " 6 " , " 7 " , " 8 " , " 9 " ,
2016-08-12 18:34:11 -07:00
] ) )
2016-09-10 21:23:57 -07:00
CHARACTER_MAPS = dict (
ja = JA_CHARMAP ,
en = EN_CHARMAP ,
es = ES_IT_CHARMAP ,
it = ES_IT_CHARMAP ,
de = DE_FR_CHARMAP ,
fr = DE_FR_CHARMAP ,
)
2016-08-12 18:34:11 -07:00
class PokemonString :
""" A string encoded using the goofy Gen I scheme. """
def __init__ ( self , raw ) :
self . raw = raw
def decrypt ( self , language ) :
2016-09-10 21:23:57 -07:00
try :
charmap = CHARACTER_MAPS [ language ]
except KeyError :
2016-08-12 18:34:11 -07:00
raise ValueError ( " Not a known language: {!r} " . format ( language ) )
return ' ' . join (
charmap . get ( ch , ' <EFBFBD> ' ) for ch in self . raw )
class PokemonCString ( Adapter ) :
""" Construct thing for `PokemonString`. """
def __init__ ( self , name , length = None ) :
# No matter which charmap, the "end of string" character is always
# encoded as P
if length is None :
subcon = CString ( name , terminators = b ' P ' )
else :
subcon = String ( name , length , padchar = b ' P ' )
super ( ) . __init__ ( subcon )
def _encode ( self , obj , context ) :
raise NotImplementedError
def _decode ( self , obj , context ) :
return PokemonString ( obj )
2016-09-10 21:23:57 -07:00
class MacroPokemonCString ( Construct ) :
""" Similar to the above, but for strings that may contain the 0x17 " far
load " macro, whose parameters may in turn contain the NUL byte 0x50 without
marking the end of the string . Yikes . """
def _parse ( self , stream , context ) :
buf = bytearray ( )
while True :
byte , = stream . read ( 1 )
if byte == 0x17 :
# "Far load"
addr_lo , addr_hi , bank = stream . read ( 3 )
offset = unbank ( bank , addr_lo + addr_hi * 256 )
pos = stream . tell ( )
try :
stream . seek ( offset )
buf . extend ( self . _parse ( stream , context ) . raw )
finally :
stream . seek ( pos )
elif byte == 0x50 :
break
elif byte == 0x5F :
# 5F ends a Pokédex entry
buf . append ( byte )
break
else :
buf . append ( byte )
return PokemonString ( bytes ( buf ) )
2016-08-12 18:34:11 -07:00
class NullTerminatedArray ( Subconstruct ) :
_peeker = Peek ( ULInt8 ( ' ___ ' ) )
__slots__ = ( )
def __init__ ( self , subcon ) :
super ( ) . __init__ ( subcon )
self . _clear_flag ( self . FLAG_COPY_CONTEXT )
self . _set_flag ( self . FLAG_DYNAMIC )
def _parse ( self , stream , context ) :
from construct . lib import ListContainer
obj = ListContainer ( )
orig_context = context
while True :
nextbyte = self . _peeker . parse_stream ( stream )
if nextbyte == 0 :
break
if self . subcon . conflags & self . FLAG_COPY_CONTEXT :
context = orig_context . __copy__ ( )
# TODO what if we hit the end of the stream
obj . append ( self . subcon . _parse ( stream , context ) )
# Consume the trailing zero
stream . read ( 1 )
return obj
def _build ( self , obj , stream , context ) :
raise NotImplementedError
# TODO ???
#def _sizeof(self, context):
def IdentEnum ( subcon , mapping ) :
return Enum ( subcon , * * { v : k for ( k , v ) in mapping . items ( ) } )
# Game Boy header, at 0x0100
# http://gbdev.gg8.se/wiki/articles/The_Cartridge_Header
# TODO hey! i wish i had a little cli entry point that would spit this out for a game. and do other stuff like scan for likely pokemon text or graphics. that would be really cool in fact. maybe put this in a gb module and make that exist sometime.
game_boy_header_struct = Struct (
' game_boy_header ' ,
# Entry point for the game; generally contains a jump to 0x0150
String ( ' entry_point ' , 4 ) ,
# Nintendo logo; must be exactly this or booting will not continue
Const (
String ( ' nintendo_logo ' , 48 ) ,
bytes . fromhex ( """
CE ED 66 66 CC 0 D 00 0 B 03 73 00 83 00 0 C 00 0 D
00 08 11 1 F 88 89 00 0 E DC CC 6 E E6 DD DD D9 99
BB BB 67 63 6 E 0 E EC CC DD DC 99 9 F BB B9 33 3 E
""" .replace( ' \n ' , ' ' )),
) ,
String ( ' title ' , 11 , padchar = b ' \x00 ' ) ,
String ( ' manufacturer_code ' , 4 ) ,
ULInt8 ( ' cgb_flag ' ) ,
String ( ' new_licensee_code ' , 2 ) ,
ULInt8 ( ' sgb_flag ' ) , # 3 for super game boy support
ULInt8 ( ' cartridge_type ' ) ,
ULInt8 ( ' rom_size ' ) ,
ULInt8 ( ' ram_size ' ) ,
ULInt8 ( ' region_code ' ) , # 0 for japan, 1 for not japan
ULInt8 ( ' old_licensee_code ' ) , # 0x33 means to use licensee_code
ULInt8 ( ' game_version ' ) ,
ULInt8 ( ' header_checksum ' ) ,
UBInt16 ( ' cart_checksum ' ) ,
)
# The mother lode — Pokémon base stats
pokemon_struct = Struct (
' pokemon ' ,
ULInt8 ( ' pokedex_number ' ) ,
ULInt8 ( ' base_hp ' ) ,
ULInt8 ( ' base_attack ' ) ,
ULInt8 ( ' base_defense ' ) ,
ULInt8 ( ' base_speed ' ) ,
ULInt8 ( ' base_special ' ) ,
IdentEnum ( ULInt8 ( ' type1 ' ) , TYPE_IDENTIFIERS ) ,
IdentEnum ( ULInt8 ( ' type2 ' ) , TYPE_IDENTIFIERS ) ,
ULInt8 ( ' catch_rate ' ) ,
ULInt8 ( ' base_experience ' ) ,
# TODO ???? "sprite dimensions"
ULInt8 ( ' _sprite_dimensions ' ) ,
ULInt16 ( ' front_sprite_pointer ' ) ,
ULInt16 ( ' back_sprite_pointer ' ) ,
# TODO somehow rig this to discard trailing zeroes; there's a paddedstring that does it
Array ( 4 , IdentEnum ( ULInt8 ( ' initial_moveset ' ) , MOVE_IDENTIFIERS ) ) ,
IdentEnum ( ULInt8 ( ' growth_rate ' ) , GROWTH_RATES ) ,
# TODO argh, this is a single huge integer; i want an array, but then i lose the byteswapping!
Bitwise (
BitField ( ' machines ' , 7 * 8 , swapped = True ) ,
) ,
Padding ( 1 ) ,
)
evos_moves_struct = Struct (
' evos_moves ' ,
NullTerminatedArray (
Struct (
' evolutions ' ,
IdentEnum ( ULInt8 ( ' evo_trigger ' ) , EVOLUTION_TRIGGERS ) ,
Embedded ( Switch (
' evo_arguments ' ,
lambda ctx : ctx . evo_trigger , {
2016-08-14 00:15:30 -07:00
' evolution-trigger.level-up ' : Struct (
2016-08-12 18:34:11 -07:00
' --- ' ,
ULInt8 ( ' evo_level ' ) ,
) ,
2016-08-14 00:15:30 -07:00
' evolution-trigger.use-item ' : Struct (
2016-08-12 18:34:11 -07:00
' --- ' ,
# TODO item enum too wow!
ULInt8 ( ' evo_item ' ) ,
# TODO ??? always seems to be 1
ULInt8 ( ' evo_level ' ) ,
) ,
# TODO ??? always seems to be 1 here too
2016-08-14 00:15:30 -07:00
' evolution-trigger.trade ' : Struct (
2016-08-12 18:34:11 -07:00
' --- ' ,
ULInt8 ( ' evo_level ' ) ,
) ,
} ,
) ) ,
# TODO alas, the species here is a number, because it's an internal
# id and we switch those back using data from the game...
ULInt8 ( ' evo_species ' ) ,
) ,
) ,
NullTerminatedArray (
Struct (
' level_up_moves ' ,
ULInt8 ( ' level ' ) ,
IdentEnum ( ULInt8 ( ' move ' ) , MOVE_IDENTIFIERS ) ,
Peek ( ULInt8 ( ' _end ' ) ) ,
) ,
) ,
)
evos_moves_pointer = Struct (
' xxx ' ,
ULInt16 ( ' offset ' ) ,
# TODO hardcoded as the same bank, ugh
Pointer ( lambda ctx : ctx . offset + ( 0xE - 1 ) * 0x4000 , evos_moves_struct ) ,
)
2016-09-10 21:23:57 -07:00
# There are actually two versions of this struct... an imperial one, used by
# the US, and a metric one, used by the ENTIRE REST OF THE WORLD. The imperial
# one has separate bytes for feet and inches, so it's a different size, making
# it completely incompatible.
pokedex_flavor_struct_metric = Struct (
' pokedex_flavor_metric ' ,
PokemonCString ( ' genus ' ) ,
2016-08-12 18:34:11 -07:00
ULInt8 ( ' height_decimeters ' ) ,
ULInt16 ( ' weight_hectograms ' ) ,
2016-09-10 21:23:57 -07:00
MacroPokemonCString ( ' flavor_text ' ) ,
2016-08-12 18:34:11 -07:00
)
2016-09-10 21:23:57 -07:00
pokedex_flavor_struct_imperial = Struct (
' pokedex_flavor_imperial ' ,
PokemonCString ( ' genus ' ) ,
ULInt8 ( ' height_feet ' ) ,
ULInt8 ( ' height_inches ' ) ,
2016-09-16 16:59:09 -07:00
ULInt16 ( ' weight_decipounds ' ) ,
2016-09-10 21:23:57 -07:00
MacroPokemonCString ( ' flavor_text ' ) ,
2016-08-12 18:34:11 -07:00
)
class CartDetectionError ( Exception ) :
pass
class RBYCart :
NUM_POKEMON = 151
NUM_MOVES = 165
NUM_MACHINES = 55
def __init__ ( self , path ) :
with path . open ( ' rb ' ) as f :
self . data = f . read ( )
self . stream = io . BytesIO ( self . data )
self . path = path
# Scrape these first; language detection relies on examining text
self . addrs = self . detect_addresses ( )
self . game , self . language = self . detect_game ( )
2016-09-10 21:23:57 -07:00
self . uses_metric = not self . language == ' en '
2016-08-12 18:34:11 -07:00
# And snag this before anything else happens; prevents some silly
# problems where a reified property seeks, then tries to read this, and
# it ends up seeking again
self . max_pokemon_index
def detect_addresses ( self ) :
""" The addresses of some important landmarks can vary between versions
and languages . Attempt to detect them automatically .
Return a dict of raw file offsets . The keys are the names used in the
pokered project .
"""
2016-08-21 16:44:07 -07:00
# The ideal approach is to find some assembly code that appears just
# before the data of interest. It's pretty hacky, but since
# translators (and even modders) would have little reason to rearrange
# functions or inject new ones in these odd places, it ought to work
# well enough. And it's better than ferreting out and hard-coding
# piles of addresses.
2016-08-12 18:34:11 -07:00
# The only hard part is that assembly code that contains an address
# won't work, since that address will also vary per game.
# Each of the landmarks used here appears in every official cartridge
# exactly once.
2016-08-21 16:44:07 -07:00
addresses = { }
2016-08-12 18:34:11 -07:00
# This is an entire function used by the Pokédex and which immediately
# precedes all the flavor text.
asm_DrawTileLine = bytes . fromhex ( ' c5d5 7019 0d20 fbd1 c1c9 ' )
try :
idx = self . data . index ( asm_DrawTileLine )
except ValueError :
raise CartDetectionError ( " Can ' t find flavor text pointers " )
addresses [ ' PokedexEntryPointers ' ] = idx + len ( asm_DrawTileLine )
2016-09-10 18:05:00 -07:00
match = find_code ( self . data , '''
; EvolutionAfterBattle :
ldh a , [ #hTilesetType]
push af
xor a
ld [ #wEvolutionOccurred], a
dec a
ld [ #wWhichPokemon], a
push hl
push bc
push de
ld hl , #wPartyCount
push hl
; Evolution_PartyMonLoop : ; loop over party mons
ld hl , #wWhichPokemon
inc [ hl ]
pop hl
inc hl
ld a , [ hl ]
cp $ ff ; have we reached the end of the party ?
jp z , #_done
ld [ #wEvoOldSpecies], a
push hl
ld a , [ #wWhichPokemon]
ld c , a
ld hl , #wCanEvolveFlags
ld b , #FLAG_TEST
call #Evolution_FlagAction
ld a , c
and a ; is the mon ' s bit set?
jp z , #Evolution_PartyMonLoop ; if not, go to the next mon
ld a , [ #wEvoOldSpecies]
dec a
ld b , 0
ld hl , #EvosMovesPointerTable
add a , a
rl b
ld c , a
add hl , bc
ld a , [ hl + ]
ld h , [ hl ]
ld l , a
push hl
ld a , [ #wcf91]
push af
xor a ; PLAYER_PARTY_DATA
ld [ #wMonDataLocation], a
call #LoadMonData
pop af
ld [ #wcf91], a
pop hl
''' ,
hTilesetType = 0xD7 , # FFD7
)
if not match :
2016-08-12 18:34:11 -07:00
raise CartDetectionError ( " Can ' t find evolution and moveset table " )
2016-09-10 18:05:00 -07:00
rem , inputs = match
# As usual, there's no bank given... but this code has to be in the
# same bank as the data it loads!
codebank , _ = bank ( rem . start ( ) )
addresses [ ' EvosMovesPointerTable ' ] = unbank (
codebank , inputs [ ' EvosMovesPointerTable ' ] )
2016-08-12 18:34:11 -07:00
2016-08-21 16:44:07 -07:00
# Several lists of names are accessed by a single function, which looks
# through a list of pointers to find the right set of names to use.
# That's great news for me: I can just grab all of those delicious
# pointers at once. Here's an excerpt from GetName.
match = find_code ( self . data , '''
inc d
; . skip
ld hl , #NamePointers
add hl , de
ld a , [ hl + ]
ldh [ $ 96 ] , a
ld a , [ hl ]
ldh [ $ 95 ] , a
ldh a , [ $ 95 ]
ld h , a
ldh a , [ $ 96 ]
ld l , a
ld a , [ #wd0b5]
ld b , a
ld c , 0
; . nextName
ld d , h
ld e , l
; . nextChar
ld a , [ hl + ]
cp $ 50 ; terminator @ , encoded
''' )
if not match :
raise CartDetectionError ( " Can ' t find name array " )
rem , inputs = match
start = inputs [ ' NamePointers ' ]
name_pointers = Array ( 7 , ULInt16 ( ' dummy ' ) ) . parse (
self . data [ start : start + 14 ] )
# One downside to the Game Boy memory structure is that banks are
# not stored anywhere near their corresponding addresses. Most
# bank numbers are hardcoded here, but Pokémon names are in a different
# bank in Japanese games, so we've gotta scrape the bank too...
match = find_code ( self . data , '''
; GetMonName : :
push hl
ldh a , [ #H_LOADEDROMBANK]
push af
ld a , #BANK_MonsterNames
''' ,
H_LOADEDROMBANK = 0xB8 , # full address is $FFB8; ldh adds the $FF
MBC1RomBank = 0x2000 ,
MonsterNames = name_pointers [ 0 ]
)
if not match :
raise CartDetectionError ( " Can ' t find Pokémon names " )
rem , inputs = match
addresses [ ' MonsterNames ' ] = unbank (
inputs [ ' BANK_MonsterNames ' ] , name_pointers [ 0 ] )
addresses [ ' MoveNames ' ] = unbank ( 0x2C , name_pointers [ 1 ] )
# 2: UnusedNames (unused, obviously)
addresses [ ' ItemNames ' ] = unbank ( 0x01 , name_pointers [ 3 ] )
# 4: wPartyMonOT (only useful while the game is running)
# 5: wEnemyMonOT (only useful while the game is running)
addresses [ ' TrainerNames ' ] = unbank ( 0x0E , name_pointers [ 6 ] )
2016-08-12 18:34:11 -07:00
# Finding TMs is a bit harder. They come right after a function for
# looking up a TM number, which is very short and very full of
# addresses. So here's a regex.
# `wd11e` is some address used all over the game for passing arguments
# around, which unfortunately also differs from language to language.
# In English it is, unsurprisingly, 0xD11E.
# `TechnicalMachines` is the address we're looking for, which should
# immediately follow what this matches.
2016-08-21 16:44:07 -07:00
match = find_code ( self . data , '''
ld a , [ #wd11e]
dec a
ld hl , #TechnicalMachines
ld b , $ 0
ld c , a
add hl , bc
ld a , [ hl ]
ld [ #wd11e], a
ret
''' )
if match :
rem , inputs = match
# TODO this should mayybe also check that the address immediately follows this code
matched_addr = inputs [ ' TechnicalMachines ' ]
tentative_addr = rem . end ( )
2016-08-12 18:34:11 -07:00
# Remember, addresses don't include the bank!
_ , banked_addr = bank ( tentative_addr )
if matched_addr == banked_addr :
2016-08-21 16:44:07 -07:00
asm_wd11e_addr = inputs [ ' wd11e ' ]
2016-08-12 18:34:11 -07:00
addresses [ ' TechnicalMachines ' ] = tentative_addr
2016-08-21 16:44:07 -07:00
else :
raise RuntimeError
2016-08-12 18:34:11 -07:00
# TODO should there really be more than one match?
else :
raise CartDetectionError ( " Can ' t find technical machines list " )
# Pokédex order is similarly tricky. Much like the above, this
# function converts a Pokémon's game index to its national dex number.
# These are almost immediately after the Pokédex entries themselves,
# but this actually seems easier than figuring out where a table of
# pointers ends.
2016-08-21 16:44:07 -07:00
match = find_code ( self . data , '''
push bc
push hl
ld a , [ #wd11e]
dec a
ld hl , #PokedexOrder
ld b , 0
ld c , a
add hl , bc
ld a , [ hl ]
ld [ #wd11e], a
pop hl
pop bc
ret
''' , wd11e=asm_wd11e_addr)
if match :
rem , inputs = match
matched_addr = inputs [ ' PokedexOrder ' ]
tentative_addr = rem . end ( )
2016-08-12 18:34:11 -07:00
# Remember, addresses don't include the bank!
_ , banked_addr = bank ( tentative_addr )
2016-08-21 16:44:07 -07:00
if matched_addr == banked_addr :
2016-08-12 18:34:11 -07:00
addresses [ ' PokedexOrder ' ] = tentative_addr
2016-08-21 16:44:07 -07:00
else :
raise RuntimeError
2016-08-12 18:34:11 -07:00
else :
raise CartDetectionError ( " Can ' t find Pokédex order " )
2016-08-21 16:44:07 -07:00
# Ah, but then, we have base stats. These don't have code nearby;
# they're just stuck immediately after moves. Except in R/G, where
# they appear /before/ moves! And we don't know what version we're
# running yet, because the addresses detected in this method are used
# for language detection. Hmm.
# Here's plan B: look for the function that /loads/ base stats, and
# scrape the address out of it. This function is a bit hairy; I've had
# to expand some of pokered's macros and rewrite the jumps to something
2016-09-10 18:05:00 -07:00
# that the rudimentary code matcher can understand. Also, there were
# two edits made in Yellow: bank switching is done with a function
# rather inlined, and Mew is no longer separate.
# TODO i guess it would be nice if find_code could deal with this,
# seeing as it IS just a regex, but i don't know how i'd cram the
# syntax in without a real parser™
rgb_bits = dict (
bankswitch = """
ldh [ #H_LOADEDROMBANK], a
ld [ #MBC1RomBank], a
""" ,
mewjump = """
cp #MEW
jr z , #mew
""" ,
mewblock = """
jr #done2
; . mew
ld hl , #MewBaseStats
ld de , #wMonHeader
ld bc , #MonBaseStatsLength
ld a , #BANK_MewBaseStats
call #FarCopyData
""" ,
2016-08-21 16:44:07 -07:00
)
2016-09-10 18:05:00 -07:00
yellow_bits = dict (
bankswitch = """
call #BankswitchCommon
""" ,
mewjump = " " ,
mewblock = " " ,
)
for bits in ( rgb_bits , yellow_bits ) :
code = '''
ldh a , [ #H_LOADEDROMBANK]
push af
ld a , #BANK_BaseStats
{ bankswitch }
push bc
push de
push hl
ld a , [ #wd11e]
push af
ld a , [ #wd0b5]
ld [ #wd11e],a
ld de , #FossilKabutopsPic
ld b , $ 66 ; size of Kabutops fossil and Ghost sprites
cp #FOSSIL_KABUTOPS ; Kabutops fossil
jr z , #specialID1
ld de , #GhostPic
cp #MON_GHOST ; Ghost
jr z , #specialID2
ld de , #FossilAerodactylPic
ld b , $ 77 ; size of Aerodactyl fossil sprite
cp #FOSSIL_AERODACTYL ; Aerodactyl fossil
jr z , #specialID3
{ mewjump }
ld a , #IndexToPokedexPredef
call #IndexToPokedex ; convert pokemon ID in [wd11e] to pokedex number
ld a , [ #wd11e]
dec a
ld bc , #MonBaseStatsLength
ld hl , #BaseStats
call #AddNTimes
ld de , #wMonHeader
ld bc , #MonBaseStatsLength
call #CopyData
jr #done1
; . specialID
ld hl , #wMonHSpriteDim
ld [ hl ] , b ; write sprite dimensions
inc hl
ld [ hl ] , e ; write front sprite pointer
inc hl
ld [ hl ] , d
{ mewblock }
''' .format(**bits)
match = find_code (
self . data ,
code ,
# These are constants; I left them in the above code for clarity
H_LOADEDROMBANK = 0xB8 , # full address is $FFB8; ldh adds the $FF
MBC1RomBank = 0x2000 ,
# This was scraped previously
wd11e = asm_wd11e_addr ,
)
if match :
rem , inputs = match
addresses [ ' BaseStats ' ] = unbank (
inputs [ ' BANK_BaseStats ' ] , inputs [ ' BaseStats ' ] )
if ' MewBaseStats ' in inputs :
addresses [ ' MewBaseStats ' ] = unbank (
inputs [ ' BANK_MewBaseStats ' ] , inputs [ ' MewBaseStats ' ] )
else :
addresses [ ' MewBaseStats ' ] = None
break
2016-08-21 16:44:07 -07:00
else :
raise CartDetectionError ( " Can ' t find base stats " )
2016-08-12 18:34:11 -07:00
return addresses
def detect_game ( self ) :
""" Given a cart image, return the game and language.
This is a high - level interface ; it prints stuff to stdout and raises
exceptions . Its two helpers do not .
"""
# TODO raise, don't print to stdout
# We have checksums for each of the games, but we also want to support
# a heuristic so this same code can be used for trimmed carts,
# bootlegs, fan hacks, corrupted carts, and other interesting variants.
# Try both, and warn if they don't agree.
game_c , language_c = self . detect_game_checksum ( )
game_h , language_h = self . detect_game_heuristic ( )
game = game_c or game_h
language = language_c or language_h
if game and language :
print ( " Detected {filename} as {game} , {language} " . format (
filename = self . path . name , game = game , language = language ) )
else :
print ( " Can ' t figure out what game {filename} is! " . format (
filename = self . path . name ) , end = ' ' )
if game :
# TODO should probably be a way to override this
print ( " It seems to be {} , but I can ' t figure out the language. " . format ( game ) )
elif language :
print ( " It seems to use {} text, but I can ' t figure out the version. " . format ( language ) )
else :
print ( " Nothing about it is familiar to me. " )
print ( " Bailing, sorry :( " )
sys . exit ( 1 )
# Warn about a potentially bad checksum
if not game_c or not language_c :
log . warn (
2016-09-10 21:23:57 -07:00
" Hmm. I don ' t recognize the checksum for %s , but I ' ll "
2016-08-12 18:34:11 -07:00
" continue anyway. " ,
self . path . name )
elif game_c != game_h or language_c != language_h :
log . warn (
" This is very surprising. The checksum indicates that this "
2016-09-10 21:23:57 -07:00
" game should be %s , %s , but I detected it as %s , %s . Probably "
2016-08-12 18:34:11 -07:00
" my fault, not yours. Continuing anyway. " ,
game_c , language_c , game_h , language_h )
return game , language
def detect_game_checksum ( self ) :
h = hashlib . md5 ( )
h . update ( self . data )
md5sum = h . hexdigest ( )
return GAME_RELEASE_MD5SUM_INDEX . get ( md5sum , ( None , None ) )
def detect_game_heuristic ( self ) :
# Okay, so, fun story: there's nothing /officially/ distinguishing the
# games. There's a flag in the cartridge header that's 0 for Japan and
# 1 for anywhere other than Japan, but every copy of the game I've seen
# has it set to anything other than 0 or 1, so that doesn't seem
# particularly reliable. I can't find any official and documented
# difference. It's as if they just changed the text, reassembled, and
# called it a day. In fact that's probably exactly what happened.
# That makes life a little more difficult, so let's take this a step at
# a time. We can get the name of the game for free, at least, from the
# cartridge header.
self . stream . seek ( 0x100 )
header = game_boy_header_struct . parse_stream ( self . stream )
# Nintendo decided to lop off the last five bytes of the title for
# other purposes /after/ creating the Game Boy, so the last three
# letters of e.g. POKEMON YELLOW end up in the manufacturer code.
# Let's just, ah, put those back on.
title = header . title + header . manufacturer_code . rstrip ( b ' \x00 ' )
if title == b ' POKEMON RED ' :
version = ' red '
elif title == b ' POKEMON GREEN ' :
version = ' green '
elif title == b ' POKEMON BLUE ' :
version = ' blue '
elif title == b ' POKEMON YELLOW ' :
version = ' yellow '
else :
version = None
# There's still a problem here: "red" might mean the Red from
# Red/Green, released only in Japan; or the Red from Red/Blue, the pair
# released worldwide, based on Japanese Blue.
# Easy way to tell: Red and Green are the only games in the entire
# series to use a half megabyte cartridge. Any other game, even if
# trimmed, will be just barely too big to fit in that size.
if header . rom_size == 4 : # 512K -> Red/Green
if version == ' red ' :
game = ' jp-red '
elif version == ' green ' :
game = ' jp-green '
else :
# No other game is this size
game = None
elif header . rom_size == 5 : # 1M -> Red/Blue/Yellow
if version == ' green ' :
# Doesn't make sense; there was no green game bigger than 512K
game = None
elif version == ' red ' :
game = ' ww-red '
elif version == ' blue ' :
# Can't know which Blue this is until we get the language
game = None
else :
game = version
else : # ???
return None , None
# Now for language. If the game is Japanese Red or Green, then it must
# be in Japanese, so we're done.
if game in ( ' jp-red ' , ' jp-green ' ) :
language = ' ja '
return game , language
# Otherwise, the only way to be absolutely sure is to find some text
# and see what language it's in.
self . stream . seek ( self . addrs [ ' ItemNames ' ] )
# Item 0 is MASTER BALL. The first item with a different name in every
# single language is item 4, TOWN MAP, so chew through five names.
single_string_struct = PokemonCString ( ' dummy ' )
for _ in range ( 5 ) :
name = single_string_struct . parse_stream ( self . stream )
for language , expected_name in [
( ' de ' , ' KARTE ' ) ,
( ' en ' , ' TOWN MAP ' ) ,
( ' es ' , ' MAPA PUEBLO ' ) ,
( ' fr ' , ' CARTE ' ) ,
( ' it ' , ' MAPPA CITTÀ ' ) ,
( ' ja ' , ' タウンマップ ' ) ,
] :
if name . decrypt ( language ) == expected_name :
break
else :
# TODO raise probably
language = None
# Blue is a special case, remember
if game is None and version == ' blue ' :
if language is None :
pass
elif language == ' ja ' :
game = ' jp-blue '
else :
game = ' ww-blue '
# And done!
return game , language
### From here it's all reified properties that extract on demand
@reify
def pokedex_order ( self ) :
""" Maps internal Pokémon indices to the more familiar Pokédex order.
Note that this maps to ONE LESS THAN National Dex number , so lists
can be zero - indexed .
"""
# Fetch the conversions between internal numbering and Pokédex order,
# because that's a thing Gen 1 does, for some reason.
self . stream . seek ( self . addrs [ ' PokedexOrder ' ] )
# I don't know exactly how many numbers are in this array, but it's
# more than the number of Pokémon, because there are some MISSINGNO
# gaps. It's single bytes anyway, so I'm going to keep reading them
# until I've seen every valid dex number.
unseen_dex_numbers = set ( range ( 1 , self . NUM_POKEMON + 1 ) )
internal_to_dex_order = { }
for index , dex_number in enumerate ( self . stream . read ( 256 ) , start = 1 ) :
if dex_number == 0 :
continue
internal_to_dex_order [ index ] = dex_number - 1
unseen_dex_numbers . remove ( dex_number )
if not unseen_dex_numbers :
break
assert not unseen_dex_numbers
return internal_to_dex_order
@reify
def max_pokemon_index ( self ) :
""" Largest valid value of a Pokémon index. Note that not every index
between 0 and this number is necessarily a valid Pokémon ; many of them
are Missingno . Only numbers that appear in ` pokedex_order ` are legit .
"""
return max ( self . pokedex_order )
@reify
def pokemon_names ( self ) :
""" List of Pokémon names, in Pokédex order. """
ret = [ None ] * self . NUM_POKEMON
self . stream . seek ( self . addrs [ ' MonsterNames ' ] )
2016-08-21 16:44:07 -07:00
# TODO i don't like this, but they don't have explicit terminators...
if self . language == ' ja ' :
name_length = 5
else :
name_length = 10
for index , pokemon_name in enumerate ( Array ( self . max_pokemon_index , PokemonCString ( ' ... ' , name_length ) ) . parse_stream ( self . stream ) , start = 1 ) :
2016-08-12 18:34:11 -07:00
try :
id = self . pokedex_order [ index ]
except KeyError :
continue
ret [ id ] = pokemon_name . decrypt ( self . language )
return ret
@reify
def machine_moves ( self ) :
""" List of move identifiers corresponding to TMs/HMs. """
self . stream . seek ( self . addrs [ ' TechnicalMachines ' ] )
return Array ( self . NUM_MACHINES , IdentEnum ( ULInt8 ( ' move ' ) , MOVE_IDENTIFIERS ) ) . parse_stream ( self . stream )
@reify
def pokemon_records ( self ) :
""" List of pokemon_structs. """
self . stream . seek ( self . addrs [ ' BaseStats ' ] )
2016-09-10 18:05:00 -07:00
# Mew's data is, awkwardly, stored separately pre-Yellow
if self . addrs [ ' MewBaseStats ' ] :
records = Array ( self . NUM_POKEMON - 1 , pokemon_struct ) . parse_stream ( self . stream )
self . stream . seek ( self . addrs [ ' MewBaseStats ' ] )
records . append ( pokemon_struct . parse_stream ( self . stream ) )
else :
records = Array ( self . NUM_POKEMON , pokemon_struct ) . parse_stream ( self . stream )
2016-08-12 18:34:11 -07:00
return records
@reify
def pokemon_evos_and_moves ( self ) :
""" List of evos_moves_structs, including both evolutions and level-up
moves .
"""
ret = [ None ] * self . NUM_POKEMON
self . stream . seek ( self . addrs [ ' EvosMovesPointerTable ' ] )
for index , pointer in enumerate ( Array ( self . max_pokemon_index , evos_moves_pointer ) . parse_stream ( self . stream ) , start = 1 ) :
try :
id = self . pokedex_order [ index ]
except KeyError :
continue
ret [ id ] = pointer . evos_moves
return ret
@reify
def pokedex_entries ( self ) :
""" List of pokedex_flavor_structs. """
ret = [ None ] * self . NUM_POKEMON
2016-09-10 21:23:57 -07:00
dex_bank , _ = bank ( self . addrs [ ' PokedexEntryPointers ' ] )
if self . uses_metric :
pokedex_flavor_struct = pokedex_flavor_struct_metric
else :
pokedex_flavor_struct = pokedex_flavor_struct_imperial
2016-08-12 18:34:11 -07:00
self . stream . seek ( self . addrs [ ' PokedexEntryPointers ' ] )
2016-09-10 21:23:57 -07:00
# This address is just an array of pointers
for index , address in enumerate ( Array ( self . max_pokemon_index , ULInt16 ( ' pointer ' ) ) . parse_stream ( self . stream ) , start = 1 ) :
2016-08-12 18:34:11 -07:00
try :
id = self . pokedex_order [ index ]
except KeyError :
continue
2016-09-10 21:23:57 -07:00
self . stream . seek ( unbank ( dex_bank , address ) )
ret [ id ] = pokedex_flavor_struct . parse_stream ( self . stream )
2016-08-12 18:34:11 -07:00
2016-09-10 21:23:57 -07:00
return ret
2016-08-12 18:34:11 -07:00
@reify
def move_names ( self ) :
self . stream . seek ( self . addrs [ ' MoveNames ' ] )
return Array ( NUM_MOVES , PokemonCString ( ' move_name ' ) ) . parse_stream ( self . stream )
# TODO would be slick to convert this to a construct... construct
def bitfield_to_machines ( bits , machine_moves ) :
machines = [ ]
for i , move in enumerate ( machine_moves , start = 1 ) :
bit = bits & 0x1
bits >> = 1
if bit :
machines . append ( move )
return machines
class WriterWrapper :
def __init__ ( self , locus , language ) :
self . locus = locus
self . language = language
def __setattr__ ( self , key , value ) :
# TODO finish this...
# 1. disallow reassigning an existing attr with a value
setattr ( self . locus , key , value )
def __getattr__ ( self , key ) :
return getattr ( self . locus , key )
2016-09-10 18:05:41 -07:00
def main ( base_root ) :
2016-08-12 18:34:11 -07:00
# TODO does this need to take arguments? or like, sprite mode i guess
2016-09-10 18:05:41 -07:00
carts = defaultdict ( dict ) # game => language => RBYCart
2016-08-12 18:34:11 -07:00
for filename in sys . argv [ 1 : ] :
cart = RBYCart ( Path ( filename ) )
2016-09-10 18:05:41 -07:00
game_carts = carts [ cart . game ]
if cart . language in game_carts :
print (
" WARNING: ignoring {0.path} because it ' s the same game and "
" language ( {0.game} , {0.language} ) as {1.path} "
. format ( cart , game_carts [ cart . language ] ) )
continue
game_carts [ cart . language ] = cart
for game , game_carts in sorted ( carts . items ( ) ) :
print ( )
print ( " Dumping " , game )
if game in GAME_RELEASE_MD5SUMS :
got_languages = game_carts . keys ( )
expected_languages = GAME_RELEASE_MD5SUMS [ game ] . keys ( )
extra_languages = got_languages - expected_languages
if extra_languages :
print (
" WARNING: don ' t recognize languages {} "
. format ( ' , ' . join ( sorted ( extra_languages ) ) ) )
missing_languages = expected_languages - got_languages
if missing_languages :
print (
" WARNING: missing cartridges for {} — this dump will "
" be incomplete! "
. format ( ' , ' . join ( sorted ( missing_languages ) ) ) )
root = base_root / game
root . mkdir ( exist_ok = True )
pokemons = None
for language , cart in sorted ( game_carts . items ( ) ) :
if pokemons is None :
pokemons = OrderedDict ( [
( POKEMON_IDENTIFIERS [ id + 1 ] , schema . Pokemon ( ) )
for id in range ( cart . NUM_POKEMON )
] )
for id in range ( cart . NUM_POKEMON ) :
pokemon = pokemons [ POKEMON_IDENTIFIERS [ id + 1 ] ]
#writer = WriterWrapper(pokemon)
writer = pokemon
# TODO LOLLLL
if ' name ' not in writer . __dict__ :
writer . name = { }
writer . name [ cart . language ] = cart . pokemon_names [ id ]
record = cart . pokemon_records [ id ]
# TODO put this in construct
types = [ record . type1 ]
if record . type1 != record . type2 :
types . append ( record . type2 )
writer . types = types
writer . base_stats = {
' hp ' : record . base_hp ,
' attack ' : record . base_attack ,
' defense ' : record . base_defense ,
' speed ' : record . base_speed ,
' special ' : record . base_special ,
2016-08-12 18:34:11 -07:00
}
2016-09-10 18:05:41 -07:00
writer . growth_rate = record . growth_rate
writer . base_experience = record . base_experience
#writer.pokedex_numbers = dict(kanto=record.pokedex_number)
# Starting moves are stored with the Pokémon; other level-up
# moves are stored with evolutions
level_up_moves = [
{ 1 : move }
for move in record . initial_moveset
# TODO UGH
if move != ' -- '
]
for level_up_move in cart . pokemon_evos_and_moves [ id ] . level_up_moves :
level_up_moves . append ( {
level_up_move . level : level_up_move . move ,
} )
# TODO LOLLLL
if ' moves ' not in writer . __dict__ :
writer . moves = { }
writer . moves [ ' level-up ' ] = level_up_moves
writer . moves [ ' machines ' ] = bitfield_to_machines (
record . machines , cart . machine_moves )
# Evolution
# TODO alas, the species here is a number, because it's an
# internal id and we switch those back using data from the
# game...
evolutions = [ ]
for evo_datum in cart . pokemon_evos_and_moves [ id ] . evolutions :
evo = {
' into ' : POKEMON_IDENTIFIERS [ cart . pokedex_order [ evo_datum . evo_species ] + 1 ] ,
' trigger ' : evo_datum . evo_trigger ,
' minimum-level ' : evo_datum . evo_level ,
}
# TODO insert the item trigger!
evolutions . append ( evo )
writer . evolutions = evolutions
2016-09-10 21:23:57 -07:00
# Pokédex flavor
flavor_struct = cart . pokedex_entries [ id ]
# TODO LOLLLL
if ' genus ' not in writer . __dict__ :
writer . genus = { }
writer . genus [ cart . language ] = flavor_struct . genus . decrypt ( language )
if ' flavor_text ' not in writer . __dict__ :
writer . flavor_text = { }
writer . flavor_text [ cart . language ] = flavor_struct . flavor_text . decrypt ( language )
if cart . uses_metric :
writer . height = 1000 * flavor_struct . height_decimeters
writer . weight = 100000000 * flavor_struct . weight_hectograms
else :
writer . height = 254 * (
12 * flavor_struct . height_feet
+ flavor_struct . height_inches )
2016-09-16 16:59:09 -07:00
writer . weight = 45359237 * flavor_struct . weight_decipounds
2016-09-10 21:23:57 -07:00
2016-09-10 18:05:41 -07:00
fn = root / ' pokemon.yaml '
print ( ' Writing ' , fn )
with fn . open ( ' w ' ) as f :
f . write ( Camel ( [ schema . POKEDEX_TYPES ] ) . dump ( pokemons ) )
2016-08-12 18:34:11 -07:00
if __name__ == ' __main__ ' :
2016-08-14 00:15:30 -07:00
# TODO yeah fix this up
main ( Path ( ' pokedex/data ' ) )