Skip to main content
cancel
Showing results for 
Search instead for 
Did you mean: 

Join us for an expert-led overview of the tools and concepts you'll need to become a Certified Power BI Data Analyst and pass exam PL-300. Register now.

Reply
alexha73
Regular Visitor

Data modeling after webscraping

Dear All,

 

 After some time I have been able to create a Python script that scrapes game fixtures and saves them in JSON format. Here is an extract of the information from 2 games:

 

{
"Temporada": "TEMPORADA 2022-2023",
"Data": "Data: 24-09-2022, 12:30h",
"Jornada": "Jornada 1",
"Àrbitres": [
"GARCIA MUÑOZ, ORIOL",
"ABELLO LILLO, SERGI",
"LOPEZ RODRIGUEZ, FELIPE"
],
"Gols": { "Nom": "BERNAL CASAS, MARC", "Minut": "79'", "Tipus": "normal" },
"Estadi": [
"CAMP DE FUTBOL CIUTAT ESPORTIVA JOAN GAMPER (Artificial)",
"av. del Sol, s/n, Sant Joan Despí"
],
"Comparativa": { "team1": "BARCELONA, F.C. A", "team2": "DAMM, C.F. A" },
"BARCELONA, F.C. A": {
"Titulars": {
"1": "SAUCEDO AVAROMA, JORDI",
"2": "VICTOR DELGADO, GUILLEM",
"3": "NATALI , ANDREA",
"4": "CUENCA CEJUDO, ANDRES",
"5": "TORRENTS SALVAT, JOFRE",
"6": "BERNAL CASAS, MARC",
"7": "DE MIGUEL LLAVE, CARLOS",
"8": "AVILA MARMOL, DANIEL",
"9": "HERNANDEZ TORRES, JUAN",
"10": "JUNYENT CASANOVA, QUIM",
"11": "KLUIVERT , SHANE PATRICK"
},
"Suplents": {
"12": "FARRÉ MIRÓ, LANDRY CÉPHAS",
"13": "BONFILL COLL, MAX",
"14": "FERNANDEZ CASINO, GUILLERMO",
"15": "SACA , LEONARD",
"16": "ESPART FONT, XAVI",
"17": "SYLLA DIALLO, NOUHOUN",
"18": "GISTAU FERREÑO, ÓSCAR"
},
"Equip Tècnic": [
"CARRASCO PEREA, IVAN",
"SUAREZ GALVAN, ANTONIO",
"BLANCO MORENO, ARNAU",
"PONS MARTINEZ, SIMON",
"REINA VILLATORO, SAUL",
"RIVAS GONZALEZ, PABLO"
],
"Targetes": {
"5": {
"Nom": "TORRENTS SALVAT, JOFRE",
"Minut": "36'",
"Targeta": "groga"
}
}
},
"DAMM, C.F. A": {
"Titulars": {
"1": "ESTEVEZ RUBIO, MANEL",
"2": "BORREGO CRUZADO, DAVID",
"3": "RAFÚS AULET, JORDI",
"4": "MEDINA LOPEZ, JOAN",
"5": "ANGLADA GARCIA MIRANDA, GUILLEM",
"6": "RICO CORDERO, POL",
"7": "VILLARRASO SAMPER, NIL",
"8": "ISERN GENE, ORIOL",
"9": "GONZALEZ YANES, ALEX",
"10": "RUBIRA COLAS, ADRIA",
"11": "SOLA BURGOS, IAN"
},
"Suplents": {
"12": "ROUCO BARRENA, HUGO",
"13": "LOPEZ PASCUAL, PAU",
"14": "LARGO SILVESTRE, PAU",
"15": "FERNANDEZ MARTINEZ, ELLIOT",
"16": "MORALES GOMEZ, CRISTOBAL",
"17": "DEL MORAL RUZAFA, IKER",
"18": "RIOS PEREZ, JOSE LUIS"
},
"Equip Tècnic": [
"MENGUAL GALINDO, ANTONIO",
"FALCES VIÑOLA, IGNACIO",
"MONZONÍS ZORRILLA, CARLOS ",
"MORALES SUBIRACHS, GENÍS"
],
"Targetes": {
"10": {
"Nom": "RUBIRA COLAS, ADRIA",
"Minut": "17'",
"Targeta": "groga"
},
"16": {
"Nom": "MORALES GOMEZ, CRISTOBAL",
"Minut": "79'",
"Targeta": "groga"
}
}
}
},
{
"Temporada": "TEMPORADA 2022-2023",
"Data": "Data: 19-11-2022, 11:30h",
"Jornada": "Jornada 9",
"Àrbitres": [
"GONZALEZ FERRER, PABLO",
"AARAB AARAB, ADAM",
"CRIVILLERS COLL, MIRTA"
],

 

After importing the JSON into Power BI, the way it automatically expands the data is not very helpful for building meaningful analyses. For example, I cannot see an easy way to calculate how many goals have been scored in total, or how many bookings there were in a particular game.

 

I would appreciate some guidance on what the approach should be to transform the data in Power BI to make it easier to work with.

 

Thanks,

 

{
"Temporada": "TEMPORADA 2022-2023",
"Data": "Data: 24-09-2022, 12:30h",
"Jornada": "Jornada 1",
"Àrbitres": [
"GARCIA MUÑOZ, ORIOL",
"ABELLO LILLO, SERGI",
"LOPEZ RODRIGUEZ, FELIPE"
],
"Gols": { "Nom": "BERNAL CASAS, MARC", "Minut": "79'", "Tipus": "normal" },
"Estadi": [
"CAMP DE FUTBOL CIUTAT ESPORTIVA JOAN GAMPER (Artificial)",
"av. del Sol, s/n, Sant Joan Despí"
],
"Comparativa": { "team1": "BARCELONA, F.C. A", "team2": "DAMM, C.F. A" },
"BARCELONA, F.C. A": {
"Titulars": {
"1": "SAUCEDO AVAROMA, JORDI",
"2": "VICTOR DELGADO, GUILLEM",
"3": "NATALI , ANDREA",
"4": "CUENCA CEJUDO, ANDRES",
"5": "TORRENTS SALVAT, JOFRE",
"6": "BERNAL CASAS, MARC",
"7": "DE MIGUEL LLAVE, CARLOS",
"8": "AVILA MARMOL, DANIEL",
"9": "HERNANDEZ TORRES, JUAN",
"10": "JUNYENT CASANOVA, QUIM",
"11": "KLUIVERT , SHANE PATRICK"
},
"Suplents": {
"12": "FARRÉ MIRÓ, LANDRY CÉPHAS",
"13": "BONFILL COLL, MAX",
"14": "FERNANDEZ CASINO, GUILLERMO",
"15": "SACA , LEONARD",
"16": "ESPART FONT, XAVI",
"17": "SYLLA DIALLO, NOUHOUN",
"18": "GISTAU FERREÑO, ÓSCAR"
},
"Equip Tècnic": [
"CARRASCO PEREA, IVAN",
"SUAREZ GALVAN, ANTONIO",
"BLANCO MORENO, ARNAU",
"PONS MARTINEZ, SIMON",
"REINA VILLATORO, SAUL",
"RIVAS GONZALEZ, PABLO"
],
"Targetes": {
"5": {
"Nom": "TORRENTS SALVAT, JOFRE",
"Minut": "36'",
"Targeta": "groga"
}
}
},
"DAMM, C.F. A": {
"Titulars": {
"1": "ESTEVEZ RUBIO, MANEL",
"2": "BORREGO CRUZADO, DAVID",
"3": "RAFÚS AULET, JORDI",
"4": "MEDINA LOPEZ, JOAN",
"5": "ANGLADA GARCIA MIRANDA, GUILLEM",
"6": "RICO CORDERO, POL",
"7": "VILLARRASO SAMPER, NIL",
"8": "ISERN GENE, ORIOL",
"9": "GONZALEZ YANES, ALEX",
"10": "RUBIRA COLAS, ADRIA",
"11": "SOLA BURGOS, IAN"
},
"Suplents": {
"12": "ROUCO BARRENA, HUGO",
"13": "LOPEZ PASCUAL, PAU",
"14": "LARGO SILVESTRE, PAU",
"15": "FERNANDEZ MARTINEZ, ELLIOT",
"16": "MORALES GOMEZ, CRISTOBAL",
"17": "DEL MORAL RUZAFA, IKER",
"18": "RIOS PEREZ, JOSE LUIS"
},
"Equip Tècnic": [
"MENGUAL GALINDO, ANTONIO",
"FALCES VIÑOLA, IGNACIO",
"MONZONÍS ZORRILLA, CARLOS ",
"MORALES SUBIRACHS, GENÍS"
],
"Targetes": {
"10": {
"Nom": "RUBIRA COLAS, ADRIA",
"Minut": "17'",
"Targeta": "groga"
},
"16": {
"Nom": "MORALES GOMEZ, CRISTOBAL",
"Minut": "79'",
"Targeta": "groga"
}
}
}
},
{
"Temporada": "TEMPORADA 2022-2023",
"Data": "Data: 19-11-2022, 11:30h",
"Jornada": "Jornada 9",
"Àrbitres": [
"GONZALEZ FERRER, PABLO",
"AARAB AARAB, ADAM",
"CRIVILLERS COLL, MIRTA"
],
"Gols": { "Nom": "ARQUÉS LLUMÀ, MARC", "Minut": "73'", "Tipus": "normal" },
"Estadi": [
"CAMP DE FUTBOL MPAL. DE SANTA EULÀLIA DE RIUPRIMER",
"c/ Nou, s/n (final), Santa Eulàlia De Riuprimer"
],
"Comparativa": {
"team1": "VIC RIUPRIMER REFO FUTBOL CLUB A",
"team2": "GIMNASTIC TARRAGONA, C. A"
},
"VIC RIUPRIMER REFO FUTBOL CLUB A": {
"Titulars": {
"13": "ODELL SERRA, SIMON PARIS",
"3": "CASTANY FÀBREGAS, EUDALD",
"5": "CALVET SANDEZ, RAMON",
"9": "BARRIS MACIAS, ALBERT ",
"10": "BOSCH VALLS, ORIOL",
"11": "ABOAGYE ABOAGYE, ANDREWS ANSU",
"12": "PUJOLS RIAL, PERE",
"15": "MONSO PRAT, GUIU",
"16": "COMA PUJOL, LLUC",
"17": "ASENSIO GONZALEZ, ARNAU",
"18": "IBARS CUBERAS, ELOI"
},
"Suplents": {
"1": "MORERA GRANE, ARNAU",
"6": "ARQUÉS LLUMÀ, MARC",
"7": "BENITO DUOCASTELLA, BIEL",
"8": "PUIG CRUELLS, EDUARD",
"14": "FONT DOMÈNECH, ALEIX"
},
"Equip Tècnic": ["CODINA CASALS, ENRIC", "SURIÑACH VACAS, ERNEST"]
},
"GIMNASTIC TARRAGONA, C. A": {
"Titulars": {
"1": "RUIZ MONCADA, ADRIA",
"2": "SUBIRATS NAVARRO, ORIOL",
"3": "MUÑIDO LUPIAÑEZ, DIEGO",
"4": "ANGLES MASERAS, ROGER",
"6": "NAVARRO SANTO, PAU",
"9": "TORRICO ALVAREZ, DIEGO",
"10": "MARTINEZ MARTINEZ, JOSE JAVIER",
"14": "RAMIREZ VARON, MARCO",
"17": "GARCIA CLAVERIAS, JOEL",
"19": "GRIÑAN SANCHEZ, PABLO",
"30": "BETANCOURT ROMERO, NICOLAS"
},
"Suplents": {
"5": "LOPEZ GILABERT, ARNAU",
"7": "VAZQUEZ MARTINEZ, KILIAN",
"8": "CERRATO MUÑOZ, ENEKO",
"11": "BACELLS DEMAYA, JOEL",
"12": "FERRER ORIVE, DIDAC",
"13": "ARAGONES GIMENEZ, FERRAN",
"16": "VALLDOSERA FOIX, IGNACIO",
"20": "FORNÓS GALLART, IKER"
},
"Equip Tècnic": [
"ARAGON MORENO, JOSE RICARDO",
"ROJAS GARRIGA, JORDI",
"SOLANELLAS GRISO, DAVID"
],
"Targetes": {
"9": {
"Nom": "TORRICO ALVAREZ, DIEGO",
"Minut": "35'",
"Targeta": "groga"
},
"12": {
"Nom": "FERRER ORIVE, DIDAC",
"Minut": "64'",
"Targeta": "groga"
}
}
}
},

0 REPLIES 0

Helpful resources

Announcements
Join our Fabric User Panel

Join our Fabric User Panel

This is your chance to engage directly with the engineering team behind Fabric and Power BI. Share your experiences and shape the future.

June 2025 Power BI Update Carousel

Power BI Monthly Update - June 2025

Check out the June 2025 Power BI update to learn about new features.

June 2025 community update carousel

Fabric Community Update - June 2025

Find out what's new and trending in the Fabric community.