# Copyright 2023 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import bigframes.pandas as bpd

df = bpd.read_gbq("bigquery-public-data.baseball.schedules")

Select a subset of the DF#

df = df[["gameId", "year", "homeTeamName", "awayTeamName", "duration_minutes"]]
df
# Here starts real execution, may take a while

Query job e6f77e72-820c-47ba-bd95-6b1ac360dc86 is DONE. 0 Bytes processed. Open Job

Query job 1280ea98-5503-4b32-899b-65ce4b4ad50f is DONE. 582.8 kB processed. Open Job

gameId year homeTeamName awayTeamName duration_minutes
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201

25 rows × 5 columns

[2431 rows x 5 columns in total]

Retrieve properties of the DF.#

gameId              string[pyarrow]
year                          Int64
homeTeamName        string[pyarrow]
awayTeamName        string[pyarrow]
duration_minutes              Int64
dtype: object
Index(['gameId', 'year', 'homeTeamName', 'awayTeamName', 'duration_minutes'], dtype='object')

Add a new column#

df = df.assign(title=df['homeTeamName'] + " vs " + df['awayTeamName'])
df

Query job e8a94ab7-7833-43ac-bf14-bfd4310260b9 is DONE. 582.8 kB processed. Open Job

Query job 8b1e4a6c-9f93-4588-9c34-ae324a42fd57 is DONE. 0 Bytes processed. Open Job

Query job 18db85e7-c94f-46ec-b981-5c582b5ce22a is DONE. 261.3 kB processed. Open Job

gameId year homeTeamName awayTeamName duration_minutes title
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167 Nationals vs Brewers
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172 Reds vs Brewers
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166 Orioles vs Rays
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182 Rockies vs Giants
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204 Twins vs Indians
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184 Blue Jays vs Orioles
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182 Yankees vs Mets
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191 Red Sox vs Rays
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201 Cardinals vs Pirates
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189 Rays vs Twins
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177 Rays vs Twins
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183 Royals vs Rays
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194 Astros vs Rays
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178 Dodgers vs Giants
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193 Tigers vs White Sox
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160 Cardinals vs Cubs
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169 Giants vs Cardinals
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251 Red Sox vs Twins
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151 Mets vs Braves
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153 Athletics vs Twins
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185 Twins vs Marlins
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180 Twins vs Yankees
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199 White Sox vs Orioles
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175 Diamondbacks vs Giants
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201 Braves vs Mets

25 rows × 6 columns

[2431 rows x 6 columns in total]

Manipulate the column#

df = df.rename(columns={"title": "headline"})
df

Query job ef76c434-c4bc-4b4c-bb06-61521fc85b15 is DONE. 0 Bytes processed. Open Job

Query job d3e413ee-c0c3-49fe-a2ad-f61d671593eb is DONE. 0 Bytes processed. Open Job

gameId year homeTeamName awayTeamName duration_minutes headline
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167 Nationals vs Brewers
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172 Reds vs Brewers
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166 Orioles vs Rays
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182 Rockies vs Giants
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204 Twins vs Indians
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184 Blue Jays vs Orioles
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182 Yankees vs Mets
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191 Red Sox vs Rays
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201 Cardinals vs Pirates
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189 Rays vs Twins
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177 Rays vs Twins
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183 Royals vs Rays
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194 Astros vs Rays
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178 Dodgers vs Giants
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193 Tigers vs White Sox
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160 Cardinals vs Cubs
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169 Giants vs Cardinals
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251 Red Sox vs Twins
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151 Mets vs Braves
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153 Athletics vs Twins
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185 Twins vs Marlins
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180 Twins vs Yankees
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199 White Sox vs Orioles
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175 Diamondbacks vs Giants
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201 Braves vs Mets

25 rows × 6 columns

[2431 rows x 6 columns in total]

df = df.drop(columns="headline")

Query job 051b3d23-5ab2-4022-adfc-f6553eb8532d is DONE. 0 Bytes processed. Open Job

Query job f7356669-04f8-46f9-bf9b-f8cd997d6162 is DONE. 213.3 kB processed. Open Job

gameId year homeTeamName awayTeamName duration_minutes
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201

25 rows × 5 columns

[2431 rows x 5 columns in total]

Drop Nan values#

Query job bd315bd7-1f10-4f1b-9997-10a294b1f464 is DONE. 232.7 kB processed. Open Job

Query job 972bf072-22c2-49ef-8764-1c1109dfc0a3 is DONE. 0 Bytes processed. Open Job

Query job 42c0cf8a-4276-479f-b8de-dcfce94ae42a is DONE. 213.3 kB processed. Open Job

gameId year homeTeamName awayTeamName duration_minutes
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201

25 rows × 5 columns

[2431 rows x 5 columns in total]

Join two DFs#

df1 = df[["gameId", "homeTeamName"]]
df1

Query job 3c859587-582d-4b68-8b35-7072b9a42346 is DONE. 0 Bytes processed. Open Job

Query job 15bf1d87-152a-45a5-b000-e8e72ce6a982 is DONE. 152.8 kB processed. Open Job

gameId homeTeamName
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 Nationals
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d Reds
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 Orioles
3 198f4eed-a29f-41e2-8623-cb261e5ab370 Rockies
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f Twins
5 4be9f735-a98e-4689-87ce-852cc3a1e79d Blue Jays
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 Yankees
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 Red Sox
8 7e1c2095-4fea-454c-8773-096ceb6fb05c Cardinals
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 Rays
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 Rays
11 6d2cab13-dd85-477a-8769-669069f85836 Royals
12 bca90342-7ddc-468e-b189-d43fad7528ec Astros
13 630f4f78-03cc-43c1-9e57-ababb9c11418 Dodgers
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 Tigers
15 46463c50-0f5c-4dca-a661-dd194464e791 Cardinals
16 392ad56d-972e-4f77-98e2-5f8577931cf8 Giants
17 307730fa-bbed-4221-b4e6-a2492f546fd5 Red Sox
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f Mets
19 723348ba-1645-43fc-9e22-92994f7a63bd Athletics
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 Twins
21 f2747230-7df5-4535-a475-a1c823d0d654 Twins
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 White Sox
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 Diamondbacks
24 95d548b6-2da8-4644-812e-b277fec5b91f Braves

25 rows × 2 columns

[2431 rows x 2 columns in total]

df2 = df[["gameId", "awayTeamName"]].head(2)
df2

Query job 262a8d65-8eb7-4769-b26d-4a1d93f19950 is DONE. 152.8 kB processed. Open Job

Query job a18f6c86-dbff-4846-8d21-8f8c1d700a80 is DONE. 0 Bytes processed. Open Job

Query job 9cc89303-be7a-4c34-b4c0-d1d75837a1e4 is DONE. 126 Bytes processed. Open Job

gameId awayTeamName
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 Brewers
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d Brewers

2 rows × 2 columns

[2 rows x 2 columns in total]

df1.merge(df2, on="gameId", how="inner")

Query job 1edf3455-802d-4b93-900b-9677cb43955a is DONE. 133.5 kB processed. Open Job

Query job 98cccaa5-e630-4edf-bc15-2823e89aecb6 is DONE. 0 Bytes processed. Open Job

Query job 91af749e-6afa-488a-83da-1257667460f0 is DONE. 143 Bytes processed. Open Job

gameId homeTeamName awayTeamName
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 Nationals Brewers
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d Reds Brewers

2 rows × 3 columns

[2 rows x 3 columns in total]

df1.merge(df2, on="gameId", how="outer")

Query job dfe4d1ec-9a3d-4877-ab39-bb6f1c38d070 is DONE. 133.5 kB processed. Open Job

Query job 6261a857-d256-4051-8af5-c6b04fb2795f is DONE. 0 Bytes processed. Open Job

Query job df400799-b054-4969-83a0-089fb2b25fdd is DONE. 152.9 kB processed. Open Job

gameId homeTeamName awayTeamName
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 Nationals Brewers
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d Reds Brewers
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 Orioles <NA>
3 198f4eed-a29f-41e2-8623-cb261e5ab370 Rockies <NA>
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f Twins <NA>
5 4be9f735-a98e-4689-87ce-852cc3a1e79d Blue Jays <NA>
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 Yankees <NA>
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 Red Sox <NA>
8 7e1c2095-4fea-454c-8773-096ceb6fb05c Cardinals <NA>
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 Rays <NA>
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 Rays <NA>
11 6d2cab13-dd85-477a-8769-669069f85836 Royals <NA>
12 bca90342-7ddc-468e-b189-d43fad7528ec Astros <NA>
13 630f4f78-03cc-43c1-9e57-ababb9c11418 Dodgers <NA>
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 Tigers <NA>
15 46463c50-0f5c-4dca-a661-dd194464e791 Cardinals <NA>
16 392ad56d-972e-4f77-98e2-5f8577931cf8 Giants <NA>
17 307730fa-bbed-4221-b4e6-a2492f546fd5 Red Sox <NA>
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f Mets <NA>
19 723348ba-1645-43fc-9e22-92994f7a63bd Athletics <NA>
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 Twins <NA>
21 f2747230-7df5-4535-a475-a1c823d0d654 Twins <NA>
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 White Sox <NA>
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 Diamondbacks <NA>
24 95d548b6-2da8-4644-812e-b277fec5b91f Braves <NA>

25 rows × 3 columns

[2431 rows x 3 columns in total]

df1.merge(df2, on="gameId", how="left")

Query job 9ae1e55b-36d0-4aef-ae39-67a3ad5fdb4d is DONE. 133.5 kB processed. Open Job

Query job 7a1822eb-7db9-4c54-abd5-74cb1cde6121 is DONE. 0 Bytes processed. Open Job

Query job 783d092c-5f79-4601-9365-633e48fac610 is DONE. 152.9 kB processed. Open Job

gameId homeTeamName awayTeamName
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 Nationals Brewers
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d Reds Brewers
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 Orioles <NA>
3 198f4eed-a29f-41e2-8623-cb261e5ab370 Rockies <NA>
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f Twins <NA>
5 4be9f735-a98e-4689-87ce-852cc3a1e79d Blue Jays <NA>
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 Yankees <NA>
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 Red Sox <NA>
8 7e1c2095-4fea-454c-8773-096ceb6fb05c Cardinals <NA>
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 Rays <NA>
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 Rays <NA>
11 6d2cab13-dd85-477a-8769-669069f85836 Royals <NA>
12 bca90342-7ddc-468e-b189-d43fad7528ec Astros <NA>
13 630f4f78-03cc-43c1-9e57-ababb9c11418 Dodgers <NA>
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 Tigers <NA>
15 46463c50-0f5c-4dca-a661-dd194464e791 Cardinals <NA>
16 392ad56d-972e-4f77-98e2-5f8577931cf8 Giants <NA>
17 307730fa-bbed-4221-b4e6-a2492f546fd5 Red Sox <NA>
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f Mets <NA>
19 723348ba-1645-43fc-9e22-92994f7a63bd Athletics <NA>
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 Twins <NA>
21 f2747230-7df5-4535-a475-a1c823d0d654 Twins <NA>
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 White Sox <NA>
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 Diamondbacks <NA>
24 95d548b6-2da8-4644-812e-b277fec5b91f Braves <NA>

25 rows × 3 columns

[2431 rows x 3 columns in total]

df1.merge(df2, on="gameId", how="right")

Query job ec1c442e-6ea1-461c-ada7-e3dd0454b0ca is DONE. 133.5 kB processed. Open Job

Query job 4ababa83-ad57-4520-b49d-e613256ae2f3 is DONE. 0 Bytes processed. Open Job

Query job f3db2d14-b877-46ea-8858-5cdb3706e26a is DONE. 143 Bytes processed. Open Job

gameId homeTeamName awayTeamName
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 Nationals Brewers
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d Reds Brewers

2 rows × 3 columns

[2 rows x 3 columns in total]

Concat two DFs#

Query job f0e1bda5-34f5-46e2-a396-289340074f82 is DONE. 0 Bytes processed. Open Job

Query job e7195b4a-f1ea-4bef-a4db-fa817144d249 is DONE. 213.3 kB processed. Open Job

gameId year homeTeamName awayTeamName duration_minutes
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201

25 rows × 5 columns

[4862 rows x 5 columns in total]

Access column through property#

Query job 0745cde9-9175-4e11-9721-f0c58fae90a2 is DONE. 79.9 kB processed. Open Job

Query job 4c7a65d6-63b7-44b6-8249-171139f907f5 is DONE. 0 Bytes processed. Open Job

Query job cee24fe1-cb33-4836-b158-90e293cbc057 is DONE. 60.5 kB processed. Open Job

0        Nationals
1             Reds
2          Orioles
3          Rockies
4            Twins
5        Blue Jays
6          Yankees
7          Red Sox
8        Cardinals
9             Rays
10            Rays
11          Royals
12          Astros
13         Dodgers
14          Tigers
15       Cardinals
16          Giants
17         Red Sox
18            Mets
19       Athletics
20           Twins
21           Twins
22       White Sox
23    Diamondbacks
24          Braves
Name: homeTeamName, dtype: string

Retrieve SQL#

print(df1.merge(df2, on="gameId", how="inner").sql)
WITH t0 AS (
  SELECT
    t9.`col_13`,
    t9.`col_14`,
    t9.`col_17`,
    t9.`bigframes_ordering_id`
  FROM `swast-scratch`._63cfa399614a54153cc386c27d6c0c6fdb249f9e.bqdf20240315_0f214503ed3e408abae057064ac2b4c2 AS t9
), t1 AS (
  SELECT
    t9.`col_13`,
    t9.`col_14`,
    t9.`col_16`,
    t9.`hidden_l_0`,
    t9.`hidden_r_0`
  FROM `swast-scratch`._63cfa399614a54153cc386c27d6c0c6fdb249f9e.bqdf20240315_22c51834c2b94bbc93da3d0ff27f980f AS t9
), t2 AS (
  SELECT
    t0.`col_13`,
    t0.`col_14`,
    t0.`col_17`,
    t0.`bigframes_ordering_id`
  FROM t0
), t3 AS (
  SELECT
    t1.`col_13`,
    t1.`col_14`,
    t1.`col_16`,
    t1.`hidden_l_0`,
    t1.`hidden_r_0`
  FROM t1
), t4 AS (
  SELECT
    t2.`col_13` AS `col_103`,
    t2.`col_14` AS `col_104`,
    t2.`col_17` AS `col_105`,
    t2.`bigframes_ordering_id` AS `hidden_r_0`
  FROM t2
), t5 AS (
  SELECT
    t3.`col_13` AS `col_100`,
    t3.`col_14` AS `col_101`,
    t3.`col_16` AS `col_102`,
    t3.`hidden_l_0`,
    t3.`hidden_r_0` AS `hidden_l_1`
  FROM t3
), t6 AS (
  SELECT
    coalesce(`col_101`, `col_104`) AS `col_106`,
    `col_102`,
    `col_105`,
    (
      row_number() OVER (ORDER BY `hidden_l_0` IS NULL ASC, `hidden_l_0` ASC, `hidden_r_0` IS NULL ASC, `hidden_r_0` ASC) - 1
    ) AS `bigframes_ordering_id`
  FROM t5
  INNER JOIN t4
    ON coalesce(t5.`col_101`, '$NULL_SENTINEL$') = coalesce(t4.`col_104`, '$NULL_SENTINEL$')
), t7 AS (
  SELECT
    t6.`col_106`,
    t6.`col_102`,
    t6.`col_105`,
    t6.`bigframes_ordering_id`
  FROM t6
)
SELECT
  t8.`col_106` AS `gameId`,
  t8.`col_102` AS `homeTeamName`,
  t8.`col_105` AS `awayTeamName`
FROM (
  SELECT
    t7.`col_106`,
    t7.`col_102`,
    t7.`col_105`
  FROM t7
) AS t8

Special Column Names#

df.rename(columns={"homeTeamName": "HOME    TEAM"})

Query job 9fcba646-219f-40ee-9792-d74af0ff7e22 is DONE. 0 Bytes processed. Open Job

Query job 657cdf62-f71e-482c-97f7-b66e4ac20e10 is DONE. 0 Bytes processed. Open Job

gameId year HOME TEAM awayTeamName duration_minutes
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201

25 rows × 5 columns

[2431 rows x 5 columns in total]

df.rename(columns={"homeTeamName": "homeTeam!@#$%col"})

Query job c90e0cd4-30e5-427c-8f5f-a0a8c778bc62 is DONE. 0 Bytes processed. Open Job

Query job 23bfdb6d-9411-484c-9766-93f76dfc1adc is DONE. 0 Bytes processed. Open Job

gameId year homeTeam!@#$%col awayTeamName duration_minutes
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201

25 rows × 5 columns

[2431 rows x 5 columns in total]

df3 = df.rename(columns={"homeTeamName": "team", "awayTeamName": "team"})
df3

Query job 63c2d27f-382c-4a43-8fc1-135d9fd66a54 is DONE. 0 Bytes processed. Open Job

Query job cc64185b-98e7-40d8-bf8e-2a3ea355ef67 is DONE. 0 Bytes processed. Open Job

gameId year team team duration_minutes
0 d60c6036-0ce1-4c90-8dd9-de3b403c92a8 2016 Nationals Brewers 167
1 af72a0b9-65f7-49fb-9b30-d505068bdf6d 2016 Reds Brewers 172
2 f57e1271-d217-400a-aea6-2e2d7d6a59a0 2016 Orioles Rays 166
3 198f4eed-a29f-41e2-8623-cb261e5ab370 2016 Rockies Giants 182
4 cb3ef033-dd57-41fd-b206-cdd3bc12c74f 2016 Twins Indians 204
5 4be9f735-a98e-4689-87ce-852cc3a1e79d 2016 Blue Jays Orioles 184
6 0b2de8c3-11d9-4f0f-a186-25b59f34a5d8 2016 Yankees Mets 182
7 60d80663-6ced-44aa-aad9-0f4bf8d3b4d2 2016 Red Sox Rays 191
8 7e1c2095-4fea-454c-8773-096ceb6fb05c 2016 Cardinals Pirates 201
9 f7f24ce3-7f9d-4e8a-986e-095db847c4c1 2016 Rays Twins 189
10 5c26e7fc-c99f-48b4-92c1-4a7208c8cfe9 2016 Rays Twins 177
11 6d2cab13-dd85-477a-8769-669069f85836 2016 Royals Rays 183
12 bca90342-7ddc-468e-b189-d43fad7528ec 2016 Astros Rays 194
13 630f4f78-03cc-43c1-9e57-ababb9c11418 2016 Dodgers Giants 178
14 c0cf1376-1115-4a2f-b457-3f82bbc41a89 2016 Tigers White Sox 193
15 46463c50-0f5c-4dca-a661-dd194464e791 2016 Cardinals Cubs 160
16 392ad56d-972e-4f77-98e2-5f8577931cf8 2016 Giants Cardinals 169
17 307730fa-bbed-4221-b4e6-a2492f546fd5 2016 Red Sox Twins 251
18 1cbc558f-7615-4fa9-bf97-7ccd62040d6f 2016 Mets Braves 151
19 723348ba-1645-43fc-9e22-92994f7a63bd 2016 Athletics Twins 153
20 ffbd6ecc-82e1-4e5d-9bd1-4ea210be5992 2016 Twins Marlins 185
21 f2747230-7df5-4535-a475-a1c823d0d654 2016 Twins Yankees 180
22 db3b6f35-a7a4-430a-8703-2b2f25103e17 2016 White Sox Orioles 199
23 5fc8c6f0-a70e-4d1b-877f-eb1ec8e6f636 2016 Diamondbacks Giants 175
24 95d548b6-2da8-4644-812e-b277fec5b91f 2016 Braves Mets 201

25 rows × 5 columns

[2431 rows x 5 columns in total]

Query job 089a657b-e651-4b17-a4ce-4d7be682a49c is DONE. 0 Bytes processed. Open Job

Query job 740ad61e-cf14-41f1-ae4e-23d1fb8ed155 is DONE. 82.0 kB processed. Open Job

team team
0 Nationals Brewers
1 Reds Brewers
2 Orioles Rays
3 Rockies Giants
4 Twins Indians
5 Blue Jays Orioles
6 Yankees Mets
7 Red Sox Rays
8 Cardinals Pirates
9 Rays Twins
10 Rays Twins
11 Royals Rays
12 Astros Rays
13 Dodgers Giants
14 Tigers White Sox
15 Cardinals Cubs
16 Giants Cardinals
17 Red Sox Twins
18 Mets Braves
19 Athletics Twins
20 Twins Marlins
21 Twins Yankees
22 White Sox Orioles
23 Diamondbacks Giants
24 Braves Mets

25 rows × 2 columns

[2431 rows x 2 columns in total]

Binary Operation#

df4 = df[["year", "duration_minutes"]]
df4

Query job d3b3cd83-d9cf-4c5b-9015-e3979e0857f3 is DONE. 0 Bytes processed. Open Job

Query job e4d99a58-738d-42af-863e-d1262a32c93c is DONE. 77.8 kB processed. Open Job

year duration_minutes
0 2016 167
1 2016 172
2 2016 166
3 2016 182
4 2016 204
5 2016 184
6 2016 182
7 2016 191
8 2016 201
9 2016 189
10 2016 177
11 2016 183
12 2016 194
13 2016 178
14 2016 193
15 2016 160
16 2016 169
17 2016 251
18 2016 151
19 2016 153
20 2016 185
21 2016 180
22 2016 199
23 2016 175
24 2016 201

25 rows × 2 columns

[2431 rows x 2 columns in total]

Query job e5c2b908-c539-4349-8368-50e61d8e19cd is DONE. 0 Bytes processed. Open Job

Query job c5a563d2-9780-4c51-996b-bf0242b96e39 is DONE. 77.8 kB processed. Open Job

year duration_minutes
0 2017 168
1 2017 173
2 2017 167
3 2017 183
4 2017 205
5 2017 185
6 2017 183
7 2017 192
8 2017 202
9 2017 190
10 2017 178
11 2017 184
12 2017 195
13 2017 179
14 2017 194
15 2017 161
16 2017 170
17 2017 252
18 2017 152
19 2017 154
20 2017 186
21 2017 181
22 2017 200
23 2017 176
24 2017 202

25 rows × 2 columns

[2431 rows x 2 columns in total]

Download the result as (in-memory) pandas DataFrame#

dfp = df4.to_pandas()
dfp

Query job b6495f3d-619c-429e-8904-5cdc4957d09f is DONE. 77.8 kB processed. Open Job

year duration_minutes
0 2016 167
1 2016 172
2 2016 166
3 2016 182
4 2016 204
... ... ...
2426 2016 199
2427 2016 181
2428 2016 205
2429 2016 203
2430 2016 182

2431 rows × 2 columns