The source website uses <span class='energy-text energy-text--type-fire'> to render inline energy icons. BeautifulSoup's get_text() was stripping these spans, losing the energy type information and causing merged text like 'Discard aEnergy' instead of 'Discard a Fire Energy'. Changes: - Add ENERGY_TEXT_TYPES mapping for inline energy references - Add replace_energy_text_spans() to convert spans to text before extraction - Add extract_effect_text() helper with proper text joining (separator=' ') - Update parse_attack(), parse_ability(), _parse_trainer_details() to use it - Fix JSON encoding in convert_cards.py to use UTF-8 (ensure_ascii=False) Before: 'Discard an Energy from this Pokémon' After: 'Discard a Fire Energy from this Pokémon' Re-scraped all 372 cards and regenerated 382 definitions.
42 lines
811 B
JSON
42 lines
811 B
JSON
{
|
|
"id": "a1-004-venusaur-ex",
|
|
"name": "Venusaur ex",
|
|
"card_type": "pokemon",
|
|
"hp": 190,
|
|
"pokemon_type": "grass",
|
|
"stage": "stage_2",
|
|
"variant": "ex",
|
|
"retreat_cost": 3,
|
|
"set_id": "a1",
|
|
"rarity": "double rare",
|
|
"evolves_from": "Ivysaur",
|
|
"attacks": [
|
|
{
|
|
"name": "Razor Leaf",
|
|
"cost": [
|
|
"grass",
|
|
"colorless",
|
|
"colorless"
|
|
],
|
|
"damage": 60,
|
|
"damage_display": "60"
|
|
},
|
|
{
|
|
"name": "Giant Bloom",
|
|
"cost": [
|
|
"grass",
|
|
"grass",
|
|
"colorless",
|
|
"colorless"
|
|
],
|
|
"damage": 100,
|
|
"damage_display": "100",
|
|
"effect_description": "Heal 30 damage from this Pokémon."
|
|
}
|
|
],
|
|
"weakness": {
|
|
"energy_type": "fire",
|
|
"value": 20
|
|
},
|
|
"illustrator": "PLANETA CG Works"
|
|
} |