Skip to content

ts-3156/nicodata2018

Folders and files

Name
Last commit message
Last commit date

Latest commit

 

History

9 Commits
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 

Repository files navigation

nicodata2018

# Download files from 0000.zip to 3410.zip
# (URL is a placeholder; substitute the actual download location.)
wget -r URL
# Extract one archive. The next step reads 0000.jsonl, presumably produced by
# this unzip -- verify against the archive contents.
unzip 0000.zip
# Run parse.rb on the extracted file and redirect its standard output to
# 0000.csv, the file name used by the LOAD DATA step further down.
ruby parse.rb 0000.jsonl >0000.csv
-- Create the database with utf8mb4 as its default character set, then select
-- it so the statements that follow run inside nico_data rather than in
-- whatever database (if any) the session currently has selected.
CREATE DATABASE IF NOT EXISTS nico_data DEFAULT CHARACTER SET utf8mb4;
USE nico_data;

-- One row per video, keyed by video_id.
-- The table character set is declared explicitly so stored text stays utf8mb4
-- even if the table is created in a database with a different default.
-- Integer columns use plain INT: the (11) display width has no effect on
-- storage or range and is deprecated in MySQL 8.0.17+.
-- NOTE(review): a CSV load that does not name its columns maps fields to
-- columns by position, so confirm the column order against parse.rb's output
-- before reordering anything here.
CREATE TABLE IF NOT EXISTS `videos`
(
  video_id    VARCHAR(255) NOT NULL PRIMARY KEY,
  title       VARCHAR(255),
  description TEXT,
  watch_num   INT,
  comment_num INT,
  mylist_num  INT,
  category    VARCHAR(255),
  tags        TEXT,
  upload_time DATETIME,
  file_type   VARCHAR(255),
  length      INT,           -- NOTE(review): unit not shown here (seconds?) -- confirm
  size_high   INT,           -- NOTE(review): presumably a byte count; confirm it fits in INT
  size_low    INT            -- NOTE(review): presumably a byte count; confirm it fits in INT
) DEFAULT CHARACTER SET utf8mb4;

-- Bulk-load one parsed CSV file into videos.
-- CHARACTER SET is stated explicitly so the file is decoded as utf8mb4
-- regardless of the session's default database.
-- The column list spells out the field-to-column mapping in table order, which
-- is the same mapping the statement performs when no list is given.
LOAD DATA LOCAL INFILE '/path/to/0000.csv'
INTO TABLE videos
CHARACTER SET utf8mb4
FIELDS TERMINATED BY ',' ENCLOSED BY '"'
(
  video_id,
  title,
  description,
  watch_num,
  comment_num,
  mylist_num,
  category,
  tags,
  upload_time,
  file_type,
  length,
  size_high,
  size_low
);

-- Export the tags column of every video to a CSV file under /tmp.
-- Fields are comma-separated and optionally wrapped in double quotes.
SELECT
  tags
FROM videos
INTO OUTFILE '/tmp/0000.tags.csv'
  FIELDS
    TERMINATED BY ','
    OPTIONALLY ENCLOSED BY '"';
# Run split.rb on the tag export and redirect its output to 0000.graph.csv.
# The input path is /tmp/0000.tags.csv because that is where the
# SELECT ... INTO OUTFILE step writes the file.
ruby split.rb /tmp/0000.tags.csv >0000.graph.csv

About

No description, website, or topics provided.

Resources

Stars

Watchers

Forks

Releases

No releases published

Packages

No packages published

Languages