- Ubuntu 18.04 기준
# Install the build/runtime prerequisites. google-chrome-stable is NOT installed
# here: it is not in the default Ubuntu archives, so it can only be installed
# after Google's apt repository has been registered below.
sudo apt update
sudo apt install wget g++ openjdk-8-jdk python3-dev python3-pip curl unzip -y
pip3 install selenium bs4 konlpy elasticsearch
# Register Google's signing key and apt repository, then install Chrome from it.
wget -q -O - https://dl-ssl.google.com/linux/linux_signing_key.pub | sudo apt-key add -
sudo sh -c 'echo "deb [arch=amd64] http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list'
sudo apt update
sudo apt install google-chrome-stable -y
google-chrome --version # check the installed Chrome version
# Replace <VERSION> with the ChromeDriver release that matches the Chrome version
# printed above, and <File Path> with the directory to download into.
wget -N http://chromedriver.storage.googleapis.com/<VERSION>/chromedriver_linux64.zip -P <File Path>
unzip <File Path>/chromedriver_linux64.zip
{
  "settings": {
    "analysis": {
      "analyzer": {
        "pos_analyzer": {
          "type": "custom",
          "tokenizer": "hanguel_tokenizer",
          "filter": [
            "lowercase",
            "trim"
          ]
        },
        "completion_analyzer": {
          "type": "custom",
          "char_filter": ["jaso_char"],
          "tokenizer": "icu_tokenizer"
        }
      },
      "char_filter": {
        "jaso_char": {
          "type": "icu_normalizer",
          "name": "nfkc_cf",
          "mode": "decompose"
        }
      },
      "tokenizer": {
        "hanguel_tokenizer": {
          "type": "seunjeon_tokenizer",
          "deinflect": "true",
          "decompound": "false",
          "index_eojeol": "false",
          "index_poses": ["N", "V", "M", "UNK"],
          "pos_tagging": "false",
          "max_unk_length": 8
        }
      }
    }
  },
  "mappings": {
    "doc": {
      "dynamic": "true",
      "properties": {
        "title": {
          "type": "text",
          "analyzer": "pos_analyzer",
          "copy_to": ["title_completion"]
        },
        "title_completion": {
          "type": "completion",
          "analyzer": "completion_analyzer"
        },
        "company": {
          "type": "keyword"
        },
        "job": {
          "type": "keyword"
        },
        "tech": {
          "type": "keyword"
        },
        "level": {
          "type": "integer_range"
        },
        "url": {
          "type": "keyword",
          "index": "false",
          "norms": "false"
        },
        "start_date": {
          "type": "date",
          "format": "yyyyMMdd"
        }
      }
    }
  }
}
{
  "settings": {
    "analysis": {
      "analyzer": {
        "completion_analyzer": {
          "type": "custom",
          "char_filter": ["jaso_char"],
          "tokenizer": "icu_tokenizer"
        }
      },
      "char_filter": {
        "jaso_char": {
          "type": "icu_normalizer",
          "name": "nfkc_cf",
          "mode": "decompose"
        }
      }
    }
  },
  "mappings": {
    "doc": {
      "dynamic": "true",
      "properties": {
        "tech": {
          "type": "completion",
          "analyzer": "completion_analyzer"
        }
      }
    }
  }
}
{
- url -ex) https://gitlab.com/geekermeter/data/-/edit/master/README.md
- title -ex) [FIFA ONLINE 4] Feature Game Client Engineer
- origin -ex) EA Korea
- start_date -ex) 3.11 (the format should be the same across all sites, but is not unified yet)
- newbie -ex) 신입, 경력
- content
}
- coupang
- kakao
- naver
- ncsoft
- netmarble
- nexon
- programmers
- rocketpunch
사이트 | URL | Title | origin | start_date | newbie | content | auto |
---|---|---|---|---|---|---|---|
coupang | O | X | X | X | X | X | X |
kakao | O | X | X | X | X | X | X |
naver | O | X | X | X | X | X | X |
ncsoft | O | X | X | X | X | X | X |
netmarble | O | X | X | X | X | X | X |
nexon | O | O | O | O | O | O | X |
programmers | O | O | O | O | O | O | O |
rocketpunch | O | O | O | O | O | O | O |