# NCEI
<br>

- 지점정보
    - 링크 내용은 동일함
    - https://www.ncei.noaa.gov/pub/data/noaa/isd-history.txt (내용 확인)
    - https://www.ncei.noaa.gov/pub/data/noaa/isd-history.csv (파일 다운로드)
- 국가 코드
    - Country list
        - 국가명과 국가 2글자 표현 짝 정리된 것
        - 후에 요청인자 중 stn 구성요소인 지점코드값의 국가 부분을 해석하는데에 사용
        - 293개국 존재
- 파일 리스트
    - File list
        - 파일목록
        - 파일명과 파일 크기가 나열됨
        - 후술될 요청인자 중 stn의 구성요소인 지점코드 값으로 활용할 수 있음
            - 국가 2글자, 망구분 1글자, 지점번호 8글자(총 11글자, 예: ACW00011604 → AC + W + 00011604)를 가져올 소스
        - 122236개 있음
- 실제 파일 리스트
    - data_climate/gsom-latest 내부에 존재하는 파일들
    - 122041개 있음

## 활용 library

In [1]:
import pandas as pd
import numpy as np
import os

## Country List와 File List 병합
- FileList 파일명에서 접두사 `gsom_` 바로 뒤의 두 글자(0부터 세는 인덱스 5, 6 / 앞에서 6~7번째 글자)가 Country List의 FIPS ID와 동일하면 해당 Country Name을 추가해준다

In [2]:
# Load the country table and the file listing; both CSVs are decoded as EUC-KR.
dfCountry = pd.read_csv(
    'data_climate/country_list.csv',
    sep=',', encoding='euc-kr', engine='python',
)
dfFileList = pd.read_csv(
    'data_climate/file_list.csv',
    sep=',', encoding='euc-kr', engine='python',
)

In [3]:
dfCountry

Unnamed: 0,FIPS ID,COUNTRY NAME
0,AA,ARUBA
1,AC,ANTIGUA AND BARBUDA
2,AF,AFGHANISTAN
3,AG,ALGERIA
4,AI,ASCENSION ISLAND
...,...,...
288,YY,"ST. MARTEEN, ST. EUSTATIUS, AND SABA"
289,ZA,ZAMBIA
290,ZI,ZIMBABWE
291,ZM,SAMOA


In [4]:
dfFileList

Unnamed: 0,FILE,SIZE
0,gsom_ACW00011604.csv,4036
1,gsom_ACW00011647.csv,34313
2,gsom_AE000041196.csv,130742
3,gsom_AEM00041194.csv,100242
4,gsom_AEM00041217.csv,85259
...,...,...
122231,gsom_ZI000067965.csv,114617
122232,gsom_ZI000067969.csv,116596
122233,gsom_ZI000067975.csv,200883
122234,gsom_ZI000067977.csv,84153


In [5]:
# Store characters at positions 5-6 of FILE (the two letters right after the
# 5-character "gsom_" prefix seen in the listing) as the join key ID.
dfFileList['ID'] = dfFileList['FILE'].str.slice(start=5, stop=7)
dfFileList

Unnamed: 0,FILE,SIZE,ID
0,gsom_ACW00011604.csv,4036,AC
1,gsom_ACW00011647.csv,34313,AC
2,gsom_AE000041196.csv,130742,AE
3,gsom_AEM00041194.csv,100242,AE
4,gsom_AEM00041217.csv,85259,AE
...,...,...,...
122231,gsom_ZI000067965.csv,114617,ZI
122232,gsom_ZI000067969.csv,116596,ZI
122233,gsom_ZI000067975.csv,200883,ZI
122234,gsom_ZI000067977.csv,84153,ZI


In [6]:
# Left join: every listed file is kept, and files whose ID has no matching
# FIPS ID end up with NaN in the country columns.
dfCountryList = dfFileList.merge(
    dfCountry, how='left', left_on='ID', right_on='FIPS ID',
)
dfCountryList

Unnamed: 0,FILE,SIZE,ID,FIPS ID,COUNTRY NAME
0,gsom_ACW00011604.csv,4036,AC,AC,ANTIGUA AND BARBUDA
1,gsom_ACW00011647.csv,34313,AC,AC,ANTIGUA AND BARBUDA
2,gsom_AE000041196.csv,130742,AE,,
3,gsom_AEM00041194.csv,100242,AE,,
4,gsom_AEM00041217.csv,85259,AE,,
...,...,...,...,...,...
122231,gsom_ZI000067965.csv,114617,ZI,ZI,ZIMBABWE
122232,gsom_ZI000067969.csv,116596,ZI,ZI,ZIMBABWE
122233,gsom_ZI000067975.csv,200883,ZI,ZI,ZIMBABWE
122234,gsom_ZI000067977.csv,84153,ZI,ZI,ZIMBABWE


In [7]:
dfCountryList.isnull().sum()

FILE            0
SIZE            0
ID              0
FIPS ID         6
COUNTRY NAME    6
dtype: int64

In [8]:
dfCountryList[dfCountryList['FIPS ID'].isnull()]

Unnamed: 0,FILE,SIZE,ID,FIPS ID,COUNTRY NAME
2,gsom_AE000041196.csv,130742,AE,,
3,gsom_AEM00041194.csv,100242,AE,,
4,gsom_AEM00041217.csv,85259,AE,,
5,gsom_AEM00041218.csv,48310,AE,,
46733,gsom_NNM00078866.csv,54757,NN,,
52317,gsom_UCM00078988.csv,56684,UC,,


In [9]:
# Distinct two-letter IDs that found no match in the country table.
CountryNull = dfCountryList.loc[dfCountryList['FIPS ID'].isna(), 'ID'].unique()
CountryNull

array(['AE', 'NN', 'UC'], dtype=object)

In [10]:
# FILENM is FILE with its first five characters removed, which gives the same
# form as the file names found on disk (used as the join key further down).
dfCountryList['FILENM'] = dfCountryList['FILE'].str.slice(start=5)
dfCountryList

Unnamed: 0,FILE,SIZE,ID,FIPS ID,COUNTRY NAME,FILENM
0,gsom_ACW00011604.csv,4036,AC,AC,ANTIGUA AND BARBUDA,ACW00011604.csv
1,gsom_ACW00011647.csv,34313,AC,AC,ANTIGUA AND BARBUDA,ACW00011647.csv
2,gsom_AE000041196.csv,130742,AE,,,AE000041196.csv
3,gsom_AEM00041194.csv,100242,AE,,,AEM00041194.csv
4,gsom_AEM00041217.csv,85259,AE,,,AEM00041217.csv
...,...,...,...,...,...,...
122231,gsom_ZI000067965.csv,114617,ZI,ZI,ZIMBABWE,ZI000067965.csv
122232,gsom_ZI000067969.csv,116596,ZI,ZI,ZIMBABWE,ZI000067969.csv
122233,gsom_ZI000067975.csv,200883,ZI,ZI,ZIMBABWE,ZI000067975.csv
122234,gsom_ZI000067977.csv,84153,ZI,ZI,ZIMBABWE,ZI000067977.csv


## NCEI 파일 목록을 가져오기

In [11]:
# Directory whose .csv entries are treated as the files actually on disk.
path = 'data_climate/gsom-latest'
file_list = os.listdir(path)
# os.listdir() returns entries in arbitrary order. Later cells take positional
# chunks from this list (e.g. [0:10000], [10000:20000]), so sort it to make
# those chunks reproducible across runs and machines.
file_list_csv = sorted(file for file in file_list if file.endswith(".csv"))

In [12]:
len(file_list_csv)

122041

가지고 있는 파일과 파일리스트를 merge하여 파일 보유 정보를 확인하기

In [13]:
# One-column frame holding the names of the CSV files found on disk.
dfRealFileList = pd.DataFrame({'RealFileNM': file_list_csv})

In [14]:
dfRealFileList

Unnamed: 0,RealFileNM
0,ACW00011604.csv
1,ACW00011647.csv
2,AE000041196.csv
3,AEM00041194.csv
4,AEM00041217.csv
...,...
122036,ZI000067969.csv
122037,ZI000067975.csv
122038,ZI000067977.csv
122039,ZI000067983.csv


In [15]:
# Left join from the on-disk files: files absent from the listing keep a row
# but get NaN in every column that comes from dfCountryList.
dfFinalFileList = dfRealFileList.merge(
    dfCountryList, how='left', left_on='RealFileNM', right_on='FILENM',
)
dfFinalFileList

Unnamed: 0,RealFileNM,FILE,SIZE,ID,FIPS ID,COUNTRY NAME,FILENM
0,ACW00011604.csv,gsom_ACW00011604.csv,4036.0,AC,AC,ANTIGUA AND BARBUDA,ACW00011604.csv
1,ACW00011647.csv,gsom_ACW00011647.csv,34313.0,AC,AC,ANTIGUA AND BARBUDA,ACW00011647.csv
2,AE000041196.csv,gsom_AE000041196.csv,130742.0,AE,,,AE000041196.csv
3,AEM00041194.csv,gsom_AEM00041194.csv,100242.0,AE,,,AEM00041194.csv
4,AEM00041217.csv,gsom_AEM00041217.csv,85259.0,AE,,,AEM00041217.csv
...,...,...,...,...,...,...,...
122036,ZI000067969.csv,gsom_ZI000067969.csv,116596.0,ZI,ZI,ZIMBABWE,ZI000067969.csv
122037,ZI000067975.csv,gsom_ZI000067975.csv,200883.0,ZI,ZI,ZIMBABWE,ZI000067975.csv
122038,ZI000067977.csv,gsom_ZI000067977.csv,84153.0,ZI,ZI,ZIMBABWE,ZI000067977.csv
122039,ZI000067983.csv,gsom_ZI000067983.csv,193672.0,ZI,ZI,ZIMBABWE,ZI000067983.csv


In [16]:
dfFinalFileList.isnull().sum()

RealFileNM       0
FILE            10
SIZE            10
ID              10
FIPS ID         16
COUNTRY NAME    16
FILENM          10
dtype: int64

In [17]:
# Files whose country cannot be determined even with the file listing;
# these have to be looked up by hand if they are needed.
dfFinalFileList.loc[dfFinalFileList['FIPS ID'].isna()]

Unnamed: 0,RealFileNM,FILE,SIZE,ID,FIPS ID,COUNTRY NAME,FILENM
2,AE000041196.csv,gsom_AE000041196.csv,130742.0,AE,,,AE000041196.csv
3,AEM00041194.csv,gsom_AEM00041194.csv,100242.0,AE,,,AEM00041194.csv
4,AEM00041217.csv,gsom_AEM00041217.csv,85259.0,AE,,,AEM00041217.csv
5,AEM00041218.csv,gsom_AEM00041218.csv,48310.0,AE,,,AEM00041218.csv
46730,NNM00078866.csv,gsom_NNM00078866.csv,54757.0,NN,,,NNM00078866.csv
52313,UCM00078988.csv,gsom_UCM00078988.csv,56684.0,UC,,,UCM00078988.csv
56124,US1AZYV0208.csv,,,,,,
59946,US1COLR1064.csv,,,,,,
72280,US1MNHN0366.csv,,,,,,
74840,US1NCBC0173.csv,,,,,,


## 모든 지역 위치정보 가져오기
- 모든 파일 첫 줄을 가져오기

In [18]:
dfRealFileList

Unnamed: 0,RealFileNM
0,ACW00011604.csv
1,ACW00011647.csv
2,AE000041196.csv
3,AEM00041194.csv
4,AEM00041217.csv
...,...
122036,ZI000067969.csv
122037,ZI000067975.csv
122038,ZI000067977.csv
122039,ZI000067983.csv


In [19]:
file_list_csv

['ACW00011604.csv',
 'ACW00011647.csv',
 'AE000041196.csv',
 'AEM00041194.csv',
 'AEM00041217.csv',
 'AEM00041218.csv',
 'AF000040930.csv',
 'AFM00040938.csv',
 'AFM00040948.csv',
 'AFM00040990.csv',
 'AG000060390.csv',
 'AG000060590.csv',
 'AG000060611.csv',
 'AG000060680.csv',
 'AGE00135039.csv',
 'AGE00147704.csv',
 'AGE00147705.csv',
 'AGE00147706.csv',
 'AGE00147707.csv',
 'AGE00147708.csv',
 'AGE00147709.csv',
 'AGE00147710.csv',
 'AGE00147711.csv',
 'AGE00147712.csv',
 'AGE00147713.csv',
 'AGE00147714.csv',
 'AGE00147715.csv',
 'AGE00147716.csv',
 'AGE00147717.csv',
 'AGE00147718.csv',
 'AGE00147719.csv',
 'AGE00147720.csv',
 'AGE00147780.csv',
 'AGE00147794.csv',
 'AGM00060351.csv',
 'AGM00060353.csv',
 'AGM00060355.csv',
 'AGM00060360.csv',
 'AGM00060367.csv',
 'AGM00060369.csv',
 'AGM00060387.csv',
 'AGM00060402.csv',
 'AGM00060403.csv',
 'AGM00060405.csv',
 'AGM00060410.csv',
 'AGM00060415.csv',
 'AGM00060417.csv',
 'AGM00060419.csv',
 'AGM00060421.csv',
 'AGM00060423.csv',


In [20]:
dfLocation = dfFinalFileList.copy()
dfLocation

Unnamed: 0,RealFileNM,FILE,SIZE,ID,FIPS ID,COUNTRY NAME,FILENM
0,ACW00011604.csv,gsom_ACW00011604.csv,4036.0,AC,AC,ANTIGUA AND BARBUDA,ACW00011604.csv
1,ACW00011647.csv,gsom_ACW00011647.csv,34313.0,AC,AC,ANTIGUA AND BARBUDA,ACW00011647.csv
2,AE000041196.csv,gsom_AE000041196.csv,130742.0,AE,,,AE000041196.csv
3,AEM00041194.csv,gsom_AEM00041194.csv,100242.0,AE,,,AEM00041194.csv
4,AEM00041217.csv,gsom_AEM00041217.csv,85259.0,AE,,,AEM00041217.csv
...,...,...,...,...,...,...,...
122036,ZI000067969.csv,gsom_ZI000067969.csv,116596.0,ZI,ZI,ZIMBABWE,ZI000067969.csv
122037,ZI000067975.csv,gsom_ZI000067975.csv,200883.0,ZI,ZI,ZIMBABWE,ZI000067975.csv
122038,ZI000067977.csv,gsom_ZI000067977.csv,84153.0,ZI,ZI,ZIMBABWE,ZI000067977.csv
122039,ZI000067983.csv,gsom_ZI000067983.csv,193672.0,ZI,ZI,ZIMBABWE,ZI000067983.csv


In [21]:
# Keep only the file name, ID and country name, then add Name: the file name
# with its last four characters (the ".csv" extension) cut off.
dfLocation.drop(columns=['FILE', 'SIZE', 'FIPS ID', 'FILENM'], inplace=True)
dfLocation['Name'] = dfLocation['RealFileNM'].str.slice(stop=-4)
dfLocation

Unnamed: 0,RealFileNM,ID,COUNTRY NAME,Name
0,ACW00011604.csv,AC,ANTIGUA AND BARBUDA,ACW00011604
1,ACW00011647.csv,AC,ANTIGUA AND BARBUDA,ACW00011647
2,AE000041196.csv,AE,,AE000041196
3,AEM00041194.csv,AE,,AEM00041194
4,AEM00041217.csv,AE,,AEM00041217
...,...,...,...,...
122036,ZI000067969.csv,ZI,ZIMBABWE,ZI000067969
122037,ZI000067975.csv,ZI,ZIMBABWE,ZI000067975
122038,ZI000067977.csv,ZI,ZIMBABWE,ZI000067977
122039,ZI000067983.csv,ZI,ZIMBABWE,ZI000067983


In [62]:
dfLocation.to_csv('data_climate/FiletoCountry.csv', index = False)

In [35]:
def location_collect(num1 = None, num2 = None):
    """Collect the first data row of each CSV in a slice of ``file_list_csv``.

    Every file named in ``file_list_csv[num1:num2]`` (a module-level list of
    file names) is read from ``data_climate/gsom-latest/`` and its first data
    row is stacked into a single DataFrame.

    Parameters
    ----------
    num1, num2 : int or None
        Start and stop positions of the slice taken from ``file_list_csv``.
        ``None`` behaves as in ordinary list slicing (from the start / to the
        end).

    Returns
    -------
    pandas.DataFrame
        The stacked first rows with a fresh 0..n-1 index. Files with
        different columns are aligned by column name (pandas' default outer
        join), so missing values appear as NaN. An empty DataFrame is
        returned when the slice selects no files.

    Notes
    -----
    Prints ``'0'`` once the first file has been read and the number of
    collected rows at the end, as a simple progress indicator.
    """
    path = 'data_climate/gsom-latest/'

    # Gather the one-row frames in a list and concatenate once at the end;
    # concatenating inside the loop re-copies the accumulated frame each time.
    first_rows = []
    for file in file_list_csv[num1: num2]:
        # Only the first data row is used, so stop parsing after one row
        # instead of loading the whole file. Column dtypes are therefore
        # inferred from that single row.
        row = pd.read_csv(path + file, nrows = 1)
        if not first_rows:
            # Marker emitted once, right after the first file was read.
            print('0')
        first_rows.append(row)

    if first_rows:
        df = pd.concat(first_rows, axis = 0, ignore_index = True)
    else:
        # An empty slice used to fail with UnboundLocalError on ``df``.
        df = pd.DataFrame()
    print(len(df))
    return df

In [23]:
dfSample = location_collect(0, 1000)
dfSample

0


Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,CDSD,CDSD_ATTRIBUTES,CLDD,CLDD_ATTRIBUTES,...,WSF1,WSF1_ATTRIBUTES,WSF2,WSF2_ATTRIBUTES,WSF5,WSF5_ATTRIBUTES,WSFG,WSFG_ATTRIBUTES,WSFM,WSFM_ATTRIBUTES
0,ACW00011604,1949-01,17.11667,-61.78333,10.1,"ST JOHNS COOLIDGE FIELD, AC",182.6,,182.6,",X",...,,,,,,,,,,
1,ACW00011647,1957-09,17.13333,-61.78333,19.2,"ST JOHNS, AC",,,,,...,,,,,,,,,,
2,AE000041196,1944-04,25.33300,55.51700,34.0,"SHARJAH INTER. AIRP, AE",,,184.1,"4,I",...,,,,,,,,,,
3,AEM00041194,1983-01,25.25500,55.36400,10.4,"DUBAI INTERNATIONAL, AE",,,,,...,,,,,,,,,,
4,AEM00041217,1983-06,24.43300,54.65100,26.8,"ABU DHABI INTERNATIONAL, AE",,,,,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
995,ASN00007156,1910-05,-27.95780,116.33830,400.0,"TARDIE STATION, AS",,,,,...,,,,,,,,,,
996,ASN00007157,1913-01,-27.77440,117.01560,450.0,"DALGARANGA, AS",,,,,...,,,,,,,,,,
997,ASN00007158,1968-09,-27.61670,118.93330,,"INGLEWOOD, AS",,,,,...,,,,,,,,,,
998,ASN00007159,1750-03,-27.54860,118.21720,450.0,"YARRAQUIN, AS",,,,,...,,,,,,,,,,


In [24]:
dfSample.to_csv('data_climate/dfLocation_sample.csv', index = False)

In [25]:
tmp = pd.read_csv('data_climate/dfLocation_sample.csv')
tmp

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,CDSD,CDSD_ATTRIBUTES,CLDD,CLDD_ATTRIBUTES,...,WSF1,WSF1_ATTRIBUTES,WSF2,WSF2_ATTRIBUTES,WSF5,WSF5_ATTRIBUTES,WSFG,WSFG_ATTRIBUTES,WSFM,WSFM_ATTRIBUTES
0,ACW00011604,1949-01,17.11667,-61.78333,10.1,"ST JOHNS COOLIDGE FIELD, AC",182.6,,182.6,",X",...,,,,,,,,,,
1,ACW00011647,1957-09,17.13333,-61.78333,19.2,"ST JOHNS, AC",,,,,...,,,,,,,,,,
2,AE000041196,1944-04,25.33300,55.51700,34.0,"SHARJAH INTER. AIRP, AE",,,184.1,"4,I",...,,,,,,,,,,
3,AEM00041194,1983-01,25.25500,55.36400,10.4,"DUBAI INTERNATIONAL, AE",,,,,...,,,,,,,,,,
4,AEM00041217,1983-06,24.43300,54.65100,26.8,"ABU DHABI INTERNATIONAL, AE",,,,,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
995,ASN00007156,1910-05,-27.95780,116.33830,400.0,"TARDIE STATION, AS",,,,,...,,,,,,,,,,
996,ASN00007157,1913-01,-27.77440,117.01560,450.0,"DALGARANGA, AS",,,,,...,,,,,,,,,,
997,ASN00007158,1968-09,-27.61670,118.93330,,"INGLEWOOD, AS",,,,,...,,,,,,,,,,
998,ASN00007159,1750-03,-27.54860,118.21720,450.0,"YARRAQUIN, AS",,,,,...,,,,,,,,,,


In [36]:
df1 = location_collect(0, 10000)

0
10000


In [37]:
df1

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,CDSD,CDSD_ATTRIBUTES,CLDD,CLDD_ATTRIBUTES,...,WSF1,WSF1_ATTRIBUTES,WSF2,WSF2_ATTRIBUTES,WSF5,WSF5_ATTRIBUTES,WSFG,WSFG_ATTRIBUTES,WSFM,WSFM_ATTRIBUTES
0,ACW00011604,1949-01,17.11667,-61.78333,10.1,"ST JOHNS COOLIDGE FIELD, AC",182.6,,182.6,",X",...,,,,,,,,,,
1,ACW00011647,1957-09,17.13333,-61.78333,19.2,"ST JOHNS, AC",,,,,...,,,,,,,,,,
2,AE000041196,1944-04,25.33300,55.51700,34.0,"SHARJAH INTER. AIRP, AE",,,184.1,"4,I",...,,,,,,,,,,
3,AEM00041194,1983-01,25.25500,55.36400,10.4,"DUBAI INTERNATIONAL, AE",,,,,...,,,,,,,,,,
4,AEM00041217,1983-06,24.43300,54.65100,26.8,"ABU DHABI INTERNATIONAL, AE",,,,,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,ASN00051026,1905-09,-31.56290,146.71810,215.0,"HERMIDALE TANK, AS",,,,,...,,,,,,,,,,
9996,ASN00051027,1928-02,-31.10000,147.30000,,"ILLABUNDA, AS",,,,,...,,,,,,,,,,
9997,ASN00051028,1899-08,-31.51670,147.38330,177.0,"NYNGAN KALUGA, AS",,,,,...,,,,,,,,,,
9998,ASN00051029,1885-07,-31.43330,147.43330,174.0,"NYNGAN MERRYANBONE, AS",,,,,...,,,,,,,,,,


In [38]:
df1.to_csv('data_climate/dfLocation_1.csv')

In [26]:
df2 = location_collect(10000, 20000)

0


In [27]:
df2

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,TSUN,TSUN_ATTRIBUTES,WDFM,WDFM_ATTRIBUTES,WSFM,WSFM_ATTRIBUTES,WDF1,WDF1_ATTRIBUTES,WSF1,WSF1_ATTRIBUTES
0,ASN00051031,1889-03,-31.6395,147.3160,179.0,"NYNGAN CANONBAR, AS",5.0,",a",5.0,",a",...,,,,,,,,,,
1,ASN00051032,1886-01,-31.2000,148.7000,298.7,"MOUNT TENANDRA, AS",5.0,",a",2.0,",a",...,,,,,,,,,,
2,ASN00051033,1750-03,-31.8576,147.1343,182.0,"NYNGAN MUDALL, AS",4.0,"2,a",3.0,"2,a",...,,,,,,,,,,
3,ASN00051034,1750-03,-31.4986,147.6865,192.0,"WARREN MUMBLEBONE, AS",3.0,"2,a",3.0,"2,a",...,,,,,,,,,,
4,ASN00051035,1896-01,-32.1500,148.1000,,"MUNGERIBAR, AS",0.0,",a",0.0,",a",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,BR002749033,1976-05,-27.3900,-49.3700,550.0,"VIDAL RAMOS, BR",11.0,",I",10.0,",I",...,,,,,,,,,,
9996,BR002749034,1976-05,-27.5100,-49.2900,700.0,"LEOBERTO LEAL, BR",15.0,",I",9.0,",I",...,,,,,,,,,,
9997,BR002749035,1976-09,-27.7400,-49.9400,900.0,"BOCAINA DO SUL, BR",7.0,",I",4.0,",I",...,,,,,,,,,,
9998,BR002749037,1976-06,-27.6800,-49.3700,454.0,"SALTINHO, BR",8.0,",I",2.0,",I",...,,,,,,,,,,


In [28]:
df2.to_csv('data_climate/dfLocation_2.csv')

In [29]:
df3 = location_collect(20000, 30000)

0


In [30]:
df3

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,DYSD,DYSD_ATTRIBUTES,EMSD,EMSD_ATTRIBUTES,WDFG,WDFG_ATTRIBUTES,WSFG,WSFG_ATTRIBUTES,DYTS,DYTS_ATTRIBUTES
0,BR002749039,1979-01,-27.2100,-49.6300,350.0,"RIO DO SUL NOVO PCD, BR",9.0,",I",2.0,",I",...,,,,,,,,,,
1,BR002749041,1983-01,-27.4100,-49.8300,850.0,"AGROLANDIA, BR",7.0,",I",4.0,",I",...,,,,,,,,,,
2,BR002749045,1986-09,-27.2000,-49.0900,0.0,"BOTUVERA MONTANTE, BR",7.0,",I",7.0,",I",...,,,,,,,,,,
3,BR002749046,1988-02,-27.3300,-49.3300,0.0,"SALSEIRO PCD, BR",12.0,",I",7.0,",I",...,,,,,,,,,,
4,BR002750001,1969-11,-27.9000,-50.7500,980.0,"CAMPO BELO DO SUL, BR",9.0,",I",8.0,",I",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,CA007024400,1906-05,45.4167,-73.9333,27.0,"MACDONALD COLLEGE, QC CA",11.0,",C",7.0,",C",...,,,,,,,,,,
9996,CA007024440,1948-07,45.2667,-72.1167,274.0,"MAGOG, QC CA",6.0,"5,C",5.0,"5,C",...,,,,,,,,,,
9997,CA007024615,1978-10,46.3333,-71.9833,96.0,"MANSEAU, QC CA",15.0,",C",9.0,",C",...,,,,,,,,,,
9998,CA007024623,1965-06,45.3333,-71.5000,366.0,"MAPLE LEAF, QC CA",9.0,",C",7.0,",C",...,,,,,,,,,,


In [31]:
df3.to_csv('data_climate/dfLocation_3.csv')

In [32]:
df4 = location_collect(30000, 40000)

0


In [33]:
df4

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,RHMX,RHMX_ATTRIBUTES,TSUN,TSUN_ATTRIBUTES,WDFM,WDFM_ATTRIBUTES,WDMV,WDMV_ATTRIBUTES,WSFM,WSFM_ATTRIBUTES
0,CA007024625,1973-01,45.3167,-71.4667,445.0,"MAPLE LEAF SOUTH, QC CA",16.0,",C",8.0,",C",...,,,,,,,,,,
1,CA007024627,1960-06,45.4000,-73.1333,38.0,"MARIEVILLE, QC CA",10.0,",C",8.0,",C",...,,,,,,,,,,
2,CA007024628,1965-04,45.3000,-71.7333,259.0,"MARTINVILLE, QC CA",8.0,",C",6.0,",C",...,,,,,,,,,,
3,CA007024745,1994-08,45.5000,-73.5833,73.0,"MCTAVISH, QC CA",9.0,"5,C",5.0,"5,C",...,,,,,,,,,,
4,CA007024800,1939-11,45.5833,-70.8667,415.0,"MEGANTIC A, QC CA",9.0,",C",1.0,",C",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,JA000047424,1951-01,42.6170,141.5500,11.0,"TOMAKOMAI, JA",12.0,",I",5.0,",I",...,,,,,,,,,,
9996,JA000047426,1951-01,42.1670,142.7830,37.0,"URAKAWA, JA",11.0,",I",2.0,",I",...,,,,,,,,,,
9997,JA000047428,1951-01,41.8670,140.1170,12.0,"ESASHI, JA",27.0,",I",6.0,",I",...,,,,,,,,,,
9998,JA000047430,1951-01,41.8170,140.7500,43.0,"HAKODATE, JA",17.0,",I",3.0,",I",...,,,,,,,,,,


In [34]:
df4.to_csv('data_climate/dfLocation_4.csv')

In [39]:
df5 = location_collect(40000, 50000)

0
10000


In [40]:
df5

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,CDSD,CDSD_ATTRIBUTES,CLDD,CLDD_ATTRIBUTES,...,ASTP,ASTP_ATTRIBUTES,AWBT,AWBT_ATTRIBUTES,RHAV,RHAV_ATTRIBUTES,RHMN,RHMN_ATTRIBUTES,RHMX,RHMX_ATTRIBUTES
0,JA000047435,1956-01,44.350,143.350,16.0,"MOMBETSU, JA",0.0,I,0.0,",I",...,,,,,,,,,,
1,JA000047440,1958-01,42.300,143.317,33.0,"HIROO, JA",0.0,I,0.0,",I",...,,,,,,,,,,
2,JA000047512,1964-01,39.067,141.717,41.0,"OFUNATO, JA",0.0,I,0.0,",I",...,,,,,,,,,,
3,JA000047520,1958-01,38.750,140.317,102.0,"SHINJO, JA",0.0,I,0.0,"2,I",...,,,,,,,,,,
4,JA000047570,1954-01,37.483,139.917,213.0,"WAKAMATSU, JA",0.0,I,0.0,",I",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,SF007227210,1913-04,-23.020,29.920,1030.0,"GROBLERSPLAAS, SF",,,,,...,,,,,,,,,,
9996,SF007227490,1924-05,-23.470,29.880,1128.0,"MAASBULT, SF",,,,,...,,,,,,,,,,
9997,SF007230700,1903-10,-23.170,30.070,875.0,"ELIM HOSP, SF",,,,,...,,,,,,,,,,
9998,SF007231550,1923-02,-23.070,30.130,853.0,"GOEDEHOOP BOS, SF",,,,,...,,,,,,,,,,


In [41]:
df5.to_csv('data_climate/dfLocation_5.csv')

In [42]:
# NOTE(review): the preceding chunk collects file_list_csv[40000:50000] and
# this one starts at 60000, so positions 50000-59999 are not collected by any
# cell visible here -- confirm whether a location_collect(50000, 60000) run
# (and its saved CSV) is missing.
df6 = location_collect(60000, 70000)

0
10000


In [43]:
df6

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,HDSD,HDSD_ATTRIBUTES,HTDD,HTDD_ATTRIBUTES,TAVG,TAVG_ATTRIBUTES,TMAX,TMAX_ATTRIBUTES,TMIN,TMIN_ATTRIBUTES
0,US1COLR1205,2019-07,40.390383,-105.491471,2372.0,"ESTES PARK 2.0 NE, CO US",16.0,"1,N",5.0,"1,N",...,,,,,,,,,,
1,US1COLR1212,2020-03,40.534990,-105.089750,1548.1,"FORT COLLINS 1.8 SW, CO US",7.0,"3,N",3.0,"3,N",...,,,,,,,,,,
2,US1COLR1213,2020-08,40.507750,-104.965240,1475.8,"TIMNATH 1.8 SSE, CO US",5.0,"4,N",1.0,"4,N",...,,,,,,,,,,
3,US1COLR1216,2022-10,40.810340,-105.215840,1826.4,"LIVERMORE 4.2 N, CO US",4.0,",N",2.0,",N",...,,,,,,,,,,
4,US1COLR1217,2020-04,40.635710,-105.159860,1559.4,"LAPORTE 1.9 NW, CO US",9.0,",N",3.0,",N",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,US1MANF0036,2018-05,42.244574,-70.956462,10.7,"WEYMOUTH 2.8 NW, MA US",,,,,...,,,,,,,,,,
9996,US1MANF0039,2018-10,42.243336,-70.954796,15.8,"WEYMOUTH 2.3 N, MA US",17.0,",N",9.0,",N",...,,,,,,,,,,
9997,US1MANF0047,2019-05,42.208230,-71.235180,57.3,"WESTWOOD 1.1 WSW, MA US",,,,,...,,,,,,,,,,
9998,US1MANF0049,2019-06,42.234965,-71.147056,28.0,"DEDHAM 1.8 ESE, MA US",18.0,"1,N",9.0,"1,N",...,,,,,,,,,,


In [44]:
df6.to_csv('data_climate/dfLocation_6.csv')

In [45]:
df7 = location_collect(70000, 80000)

0
10000


In [46]:
df7

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,HDSD,HDSD_ATTRIBUTES,HTDD,HTDD_ATTRIBUTES,TAVG,TAVG_ATTRIBUTES,TMAX,TMAX_ATTRIBUTES,TMIN,TMIN_ATTRIBUTES
0,US1MANF0054,2019-11,42.259033,-71.030317,30.5,"QUINCY 1.2 W, MA US",12.0,"4,N",10.0,"4,N",...,,,,,,,,,,
1,US1MANF0058,2020-04,42.008300,-71.338500,63.7,"PLAINVILLE 0.6 NNW, MA US",15.0,",N",11.0,",N",...,,,,,,,,,,
2,US1MANF0062,2020-09,42.074391,-71.408504,92.7,"FRANKLIN 1.4 SW, MA US",6.0,",N",3.0,",N",...,,,,,,,,,,
3,US1MANF0063,2021-01,42.117610,-71.337902,61.6,"NORFOLK 1.1 W, MA US",9.0,",N",5.0,",N",...,,,,,,,,,,
4,US1MANF0064,2021-03,42.138006,-71.440061,60.4,"MEDWAY 2.1 W, MA US",5.0,"1,N",3.0,"1,N",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,US1NYON0017,2019-12,42.822000,-77.288400,256.6,"CANANDAIGUA 4.6 S, NY US",14.0,",N",8.0,",N",...,,,,,,,,,,
9996,US1NYON0018,2019-11,42.840972,-77.225832,281.0,"CANANDAIGUA 4.3 SE, NY US",9.0,"1,N",6.0,"1,N",...,,,,,,,,,,
9997,US1NYON0019,2020-09,42.627900,-77.428600,422.5,"NAPLES 1.6 WNW, NY US",8.0,",N",4.0,",N",...,,,,,,,,,,
9998,US1NYON0022,2022-05,42.851220,-76.998700,183.5,"GENEVA 1.2 SW, NY US",12.0,",N",5.0,",N",...,,,,,,,,,,


In [47]:
df7.to_csv('data_climate/dfLocation_7.csv')

In [48]:
df8 = location_collect(80000, 90000)

0
10000


In [49]:
df8

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,DSND,DSND_ATTRIBUTES,DYSD,DYSD_ATTRIBUTES,EMSD,EMSD_ATTRIBUTES,DYFG,DYFG_ATTRIBUTES,DYTS,DYTS_ATTRIBUTES
0,US1NYOR0004,2013-09,41.268357,-74.415952,189.3,"WARWICK 3.2 WNW, NY US",5.0,",N",5.0,",N",...,,,,,,,,,,
1,US1NYOR0006,2009-10,41.301445,-74.166969,253.0,"MONROE 1.7 SE, NY US",13.0,",N",8.0,",N",...,,,,,,,,,,
2,US1NYOR0015,2014-10,41.374007,-74.684483,142.3,"PORT JERVIS 0.4 SE, NY US",15.0,",N",7.0,",N",...,,,,,,,,,,
3,US1NYOR0017,2017-07,41.587962,-74.357663,126.8,"PINE BUSH 3.4 WSW, NY US",13.0,"1,N",10.0,"1,N",...,,,,,,,,,,
4,US1NYOR0018,2017-09,41.542690,-74.188349,137.8,"WALDEN 1.2 S, NY US",8.0,",N",4.0,",N",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,US1TXVC0004,2007-10,28.822000,-96.961000,29.0,"VICTORIA 1.3 E, TX US",7.0,",N",5.0,",N",...,,,,,,,,,,
9996,US1TXVC0007,2008-04,28.795720,-96.984380,34.1,"VICTORIA 2.0 S, TX US",7.0,"3,N",6.0,"3,N",...,,,,,,,,,,
9997,US1TXVC0009,2008-11,28.804625,-96.826581,21.9,"INEZ 5.3 SSW, TX US",5.0,"3,N",2.0,"3,N",...,,,,,,,,,,
9998,US1TXVC0011,2009-06,28.843042,-96.799064,15.8,"INEZ 2.2 S, TX US",1.0,"4,N",1.0,"4,N",...,,,,,,,,,,


In [50]:
df8.to_csv('data_climate/dfLocation_8.csv')

In [51]:
df9 = location_collect(90000, 100000)

0
10000


In [52]:
df9

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,LX08,LX08_ATTRIBUTES,MN07,MN07_ATTRIBUTES,MN08,MN08_ATTRIBUTES,MX07,MX07_ATTRIBUTES,MX08,MX08_ATTRIBUTES
0,US1TXVC0015,2010-03,28.844667,-97.163211,56.7,"VICTORIA 11.0 W, TX US",6.0,",N",5.0,",N",...,,,,,,,,,,
1,US1TXVC0017,2010-04,28.853700,-96.990300,33.2,"VICTORIA 2.1 NNW, TX US",6.0,",N",2.0,",N",...,,,,,,,,,,
2,US1TXVC0020,2010-07,28.778986,-96.831036,18.3,"VICTORIA 9.7 ESE, TX US",17.0,"3,N",12.0,"3,N",...,,,,,,,,,,
3,US1TXVC0021,2010-07,28.659784,-97.118868,32.3,"VICTORIA 14.0 SW, TX US",16.0,",N",12.0,",N",...,,,,,,,,,,
4,US1TXVC0022,2011-02,28.842100,-97.182317,49.4,"VICTORIA 12.1 W, TX US",6.0,"1,N",1.0,"1,N",...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,USC00143984,1904-09,37.923300,-95.424100,290.8,"IOLA 1 W, KS US",5.0,",6",4.0,",6",...,,,,,,,,,,
9996,USC00143989,1905-09,37.916670,-95.400000,292.9,"IOLA, KS US",13.0,",0",9.0,",0",...,,,,,,,,,,
9997,USC00143997,1894-01,39.661100,-98.348300,468.5,"IONIA, KS US",2.0,",6",1.0,",6",...,,,,,,,,,,
9998,USC00144008,1910-03,37.833333,-101.933333,,"IRENE, KS US",1.0,",6",0.0,",6",...,,,,,,,,,,


In [53]:
df9.to_csv('data_climate/dfLocation_9.csv')

In [54]:
df10 = location_collect(100000, 110000)

0
10000


In [55]:
df10

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,DP01,DP01_ATTRIBUTES,DP10,DP10_ATTRIBUTES,...,RHMN,RHMN_ATTRIBUTES,RHMX,RHMX_ATTRIBUTES,TSUN,TSUN_ATTRIBUTES,WDF1,WDF1_ATTRIBUTES,WSF1,WSF1_ATTRIBUTES
0,USC00144025,1988-03,39.614700,-97.856300,418.8,"JAMESTOWN, KS US",3.0,",6",2.0,",6",...,,,,,,,,,,
1,USC00144041,1894-03,39.600000,-102.033333,,"JAQUA, KS US",5.0,",6",2.0,",6",...,,,,,,,,,,
2,USC00144073,1940-07,38.720280,-100.526390,781.8,"JEROME, KS US",6.0,",6",5.0,",6",...,,,,,,,,,,
3,USC00144081,1900-12,38.083330,-99.900000,701.6,"JETMORE, KS US",2.0,",6",0.0,",6",...,,,,,,,,,,
4,USC00144085,1949-05,38.216670,-100.066670,716.9,"JETMORE 14 NW, KS US",,,,,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9995,USC00365611,1952-10,41.716670,-80.233330,345.0,"MEADVILLE 7 NW, PA US",8.0,",0",7.0,",0",...,,,,,,,,,,
9996,USC00365623,1915-01,39.933333,-75.366667,64.0,"MEDIA, PA US",14.0,",6",9.0,",6",...,,,,,,,,,,
9997,USC00365627,1948-05,41.283330,-78.400000,335.9,"MEDIX RUN, PA US",16.0,",0",13.0,",0",...,,,,,,,,,,
9998,USC00365650,1949-01,41.200000,-80.350000,390.1,"MERCER 6 W, PA US",13.0,",0",11.0,",0",...,,,,,,,,,,


In [56]:
df10.to_csv('data_climate/dfLocation_10.csv')

In [57]:
df11 = location_collect(num1 = 110000)

0
12041


In [58]:
df11

Unnamed: 0,STATION,DATE,LATITUDE,LONGITUDE,ELEVATION,NAME,CDSD,CDSD_ATTRIBUTES,CLDD,CLDD_ATTRIBUTES,...,RHAV,RHAV_ATTRIBUTES,RHMN,RHMN_ATTRIBUTES,RHMX,RHMX_ATTRIBUTES,WDF1,WDF1_ATTRIBUTES,WSF1,WSF1_ATTRIBUTES
0,USC00365652,1950-10,41.28333,-80.28333,402.9,"MERCER 4 NW, PA US",,,0.0,",0",...,,,,,,,,,,
1,USC00365654,1948-05,41.23333,-80.25000,381.0,"MERCER HIGHWAY SHED, PA US",,,,,...,,,,,,,,,,
2,USC00365662,1929-07,39.83333,-77.90000,164.9,"MERCERSBURG 1 E, PA US",,,,,...,,,,,,,,,,
3,USC00365676,1925-07,40.96667,-75.46667,300.2,"MERWINSBURG, PA US",,,,,...,,,,,,,,,,
4,USC00365684,1939-04,39.81667,-79.01667,641.0,"MEYERSDALE, PA US",,,,,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
12036,ZI000067969,1962-07,-21.05000,29.36700,861.0,"WEST NICHOLSON, ZI",1.6,Q,1.6,",Q",...,,,,,,,,,,
12037,ZI000067975,1951-07,-20.06700,30.86700,1095.0,"MASVINGO, ZI",0.0,Q,0.0,",Q",...,,,,,,,,,,
12038,ZI000067977,1968-06,-21.01700,31.58300,430.0,"BUFFALO RANGE, ZI",,,2.4,",Q",...,,,,,,,,,,
12039,ZI000067983,1951-07,-20.20000,32.61600,1132.0,"CHIPINGE, ZI",1.0,Q,1.0,",Q",...,,,,,,,,,,


In [59]:
df11.to_csv('data_climate/dfLocation_11.csv')