CDC COVID-19 case surveillance data
https://data.cdc.gov/Case-Surveillance/COVID-19-Case-Surveillance-Public-Use-Data-with-Ge/n8mc-b4w4/about_data
Example API URL: https://data.cdc.gov/resource/n8mc-b4w4.json
import pandas as pd
import seaborn as sns
# CSV endpoint of the dataset, requested with no query parameters.
csv_url = "https://data.cdc.gov/resource/n8mc-b4w4.csv"
df = pd.read_csv(filepath_or_buffer=csv_url)
# Preview the first rows of the downloaded frame.
df.head()
0 |
2020-09 |
TN |
47 |
KNOX |
47093.0 |
50 to 64 years |
Female |
White |
Non-Hispanic/Latino |
0.0 |
0.0 |
Missing |
Yes |
Laboratory-confirmed case |
Symptomatic |
No |
Missing |
Missing |
NaN |
1 |
2024-01 |
NM |
35 |
BERNALILLO |
35001.0 |
18 to 49 years |
Female |
Missing |
Hispanic/Latino |
NaN |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
Unknown |
Missing |
Missing |
NaN |
2 |
2022-01 |
NY |
36 |
MONROE |
36055.0 |
18 to 49 years |
Female |
Unknown |
Unknown |
NaN |
0.0 |
Missing |
Missing |
Laboratory-confirmed case |
Symptomatic |
Missing |
Missing |
No |
NaN |
3 |
2021-12 |
PA |
42 |
MONTGOMERY |
42091.0 |
18 to 49 years |
Male |
White |
Non-Hispanic/Latino |
0.0 |
0.0 |
Missing |
Missing |
Laboratory-confirmed case |
Symptomatic |
Unknown |
Unknown |
Unknown |
NaN |
4 |
2023-01 |
MA |
25 |
BRISTOL |
25005.0 |
50 to 64 years |
Male |
White |
Non-Hispanic/Latino |
0.0 |
NaN |
Missing |
Missing |
Probable Case |
Missing |
Missing |
Missing |
Missing |
NaN |
995 |
2021-05 |
TX |
48 |
DENTON |
48121.0 |
18 to 49 years |
Female |
Missing |
Unknown |
NaN |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
Missing |
Missing |
Missing |
NaN |
996 |
2021-01 |
NY |
36 |
NEW YORK |
36061.0 |
18 to 49 years |
Female |
White |
Non-Hispanic/Latino |
0.0 |
0.0 |
Missing |
Missing |
Laboratory-confirmed case |
Symptomatic |
Missing |
Missing |
Missing |
NaN |
997 |
2022-10 |
CA |
6 |
RIVERSIDE |
6065.0 |
65+ years |
Female |
White |
Non-Hispanic/Latino |
NaN |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Unknown |
No |
Missing |
Missing |
NaN |
998 |
2022-07 |
NC |
37 |
MECKLENBURG |
37119.0 |
18 to 49 years |
Female |
Black |
Unknown |
0.0 |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Unknown |
Unknown |
Unknown |
No |
NaN |
999 |
2022-05 |
AZ |
4 |
MARICOPA |
4013.0 |
18 to 49 years |
Female |
Missing |
Non-Hispanic/Latino |
NaN |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
No |
Missing |
Missing |
NaN |
Use the `$limit` and `$offset` query parameters to change how many rows are retrieved and the offset at which the returned rows start.
# Same CSV endpoint, with `$limit=1200` appended to ask for 1200 rows.
df_1200 = pd.read_csv(
    filepath_or_buffer='https://data.cdc.gov/resource/n8mc-b4w4.csv?$limit=1200',
)
# Look at the last rows to check how many rows actually came back.
df_1200.tail()
1195 |
2021-07 |
FL |
12 |
SARASOTA |
12115.0 |
50 to 64 years |
Female |
NaN |
NaN |
0.0 |
0.0 |
Missing |
Missing |
Probable Case |
Symptomatic |
No |
Missing |
No |
NaN |
1196 |
2021-01 |
CA |
6 |
SOLANO |
6095.0 |
18 to 49 years |
Male |
Black |
Non-Hispanic/Latino |
NaN |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Unknown |
Missing |
Missing |
Missing |
NaN |
1197 |
2022-01 |
IN |
18 |
MARION |
18097.0 |
50 to 64 years |
Female |
White |
Non-Hispanic/Latino |
0.0 |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
No |
Missing |
No |
NaN |
1198 |
2022-09 |
NJ |
34 |
BURLINGTON |
34005.0 |
18 to 49 years |
Male |
White |
Non-Hispanic/Latino |
0.0 |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
No |
Missing |
No |
NaN |
1199 |
2020-11 |
MA |
25 |
BRISTOL |
25005.0 |
18 to 49 years |
Female |
Missing |
Missing |
0.0 |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
Missing |
Missing |
Missing |
NaN |
# Request another 1200 rows, this time with `$offset=1200` added to the query.
# NOTE(review): no `$order` is given; Socrata's paging guidance suggests an
# explicit ordering (e.g. `$order=:id`) for stable pages -- confirm before
# relying on this frame being disjoint from an un-offset request.
df_1200_with_offset = pd.read_csv(
    filepath_or_buffer='https://data.cdc.gov/resource/n8mc-b4w4.csv?$limit=1200&$offset=1200',
)
# Look at the last rows of the offset page.
df_1200_with_offset.tail()
1195 |
2021-06 |
CA |
6 |
STANISLAUS |
6099.0 |
18 to 49 years |
Female |
Unknown |
Unknown |
NaN |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Unknown |
No |
Missing |
Missing |
NaN |
1196 |
2020-10 |
NC |
37 |
GASTON |
37071.0 |
65+ years |
Female |
Unknown |
Unknown |
0.0 |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Unknown |
Unknown |
Unknown |
No |
NaN |
1197 |
2021-01 |
CO |
8 |
MESA |
8077.0 |
18 to 49 years |
Male |
White |
Non-Hispanic/Latino |
NaN |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
No |
Missing |
Missing |
NaN |
1198 |
2023-08 |
SC |
45 |
AIKEN |
45003.0 |
65+ years |
Male |
White |
Non-Hispanic/Latino |
NaN |
NaN |
Missing |
Missing |
Probable Case |
Missing |
Missing |
Missing |
NaN |
NaN |
1199 |
2022-01 |
OH |
39 |
WARREN |
39165.0 |
65+ years |
Female |
NaN |
NaN |
NaN |
NaN |
Missing |
Missing |
Probable Case |
Missing |
Missing |
Missing |
Unknown |
NaN |
# One-off request for 50,000 rows; the frame is not bound to a name, only its
# last rows are shown.
(
    pd.read_csv(
        filepath_or_buffer='https://data.cdc.gov/resource/n8mc-b4w4.csv?$limit=50000',
    )
    .tail()
)
49995 |
2022-12 |
TX |
48 |
HARRIS |
48201.0 |
18 to 49 years |
Male |
White |
Non-Hispanic/Latino |
NaN |
NaN |
Missing |
Missing |
Probable Case |
Missing |
Unknown |
Missing |
Missing |
NaN |
49996 |
2021-12 |
FL |
12 |
LAKE |
12069.0 |
65+ years |
Male |
White |
Non-Hispanic/Latino |
0.0 |
0.0 |
Missing |
Missing |
Laboratory-confirmed case |
Symptomatic |
No |
Missing |
No |
NaN |
49997 |
2020-12 |
GA |
13 |
GWINNETT |
13135.0 |
18 to 49 years |
Female |
Black |
Non-Hispanic/Latino |
NaN |
0.0 |
Missing |
Missing |
Probable Case |
Symptomatic |
Missing |
Missing |
Missing |
NaN |
49998 |
2021-01 |
NJ |
34 |
MONMOUTH |
34025.0 |
0 - 17 years |
Male |
White |
Non-Hispanic/Latino |
0.0 |
0.0 |
Missing |
Missing |
Probable Case |
Symptomatic |
No |
Missing |
No |
NaN |
49999 |
2022-06 |
VA |
51 |
ARLINGTON |
51013.0 |
18 to 49 years |
Female |
Unknown |
NaN |
0.0 |
NaN |
Missing |
Missing |
Laboratory-confirmed case |
Missing |
Missing |
Missing |
Missing |
NaN |