Skip to content

Commit

Permalink
Corrections for CDH4 release and CDH5.
Browse files Browse the repository at this point in the history
- updates CDH4 dependencies to final release (beta artifacts are no long available)
- remove use of CASE as variable name, since it became a reserved word in CDH5
- corrects error in gephi generation; corrected xml validates according to gephi xmlschema
- update pom version to reflect change
  • Loading branch information
busbey committed Jan 21, 2016
1 parent 78674a2 commit e94d18d
Show file tree
Hide file tree
Showing 3 changed files with 8 additions and 7 deletions.
7 changes: 4 additions & 3 deletions pom.xml
Expand Up @@ -4,27 +4,28 @@

<groupId>com.cloudera.science</groupId>
<artifactId>ades</artifactId>
<version>0.1.0</version>
<version>0.2.0</version>
<packaging>jar</packaging>

<name>ades</name>

<properties>
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
<hadoop.version>2.0.0-mr1-cdh4.0.0</hadoop.version>
</properties>

<dependencies>
<dependency>
<groupId>org.apache.hadoop</groupId>
<artifactId>hadoop-core</artifactId>
<version>0.23.1-mr1-cdh4.0.0b2</version>
<version>${hadoop.version}</version>
<scope>provided</scope>
</dependency>

<dependency>
<groupId>org.apache.hadoop</groupId>
<artifactId>hadoop-client</artifactId>
<version>0.23.1-mr1-cdh4.0.0b2</version>
<version>${hadoop.version}</version>
<scope>provided</scope>
</dependency>

Expand Down
6 changes: 3 additions & 3 deletions src/main/pig/step1_join_drugs_reactions.pig
Expand Up @@ -43,7 +43,7 @@ drugs = LOAD 'aers/drugs' USING PigStorage('$') AS (
vbm: long, route: chararray, dose_vbm: chararray, dechal: chararray, rechal: chararray,
lot: long, exp_dt: chararray, nda: long);
demos = LOAD 'aers/demos' USING PigStorage('$') AS (
isr: long, case: int, if_cod: chararray, foll_seq: chararray, image: chararray,
isr: long, case_id: int, if_cod: chararray, foll_seq: chararray, image: chararray,
event_dt: chararray, mfr_dt: chararray, fda_dt: chararray, rept_code: chararray,
mfr_num: chararray, mfr_sndr: chararray, age: long, age_code: chararray,
gender: chararray, e_sub: chararray, weight: long, wt_code: chararray,
Expand All @@ -70,8 +70,8 @@ demos = FILTER demos BY age_code == 'YR' and (gender == 'M' or gender == 'F') an
* For simplicity, we simply choose the minimum ISR number for each case identifier
* as the representative report for that patient.
*/
demos_by_case = GROUP demos BY case;
selected = FOREACH demos_by_case GENERATE MIN(demos.isr) as isr;
demos_by_case_id = GROUP demos BY case_id;
selected = FOREACH demos_by_case_id GENERATE MIN(demos.isr) as isr;

/**
* Now we filter the demographics data to only include the reports that we selected
Expand Down
2 changes: 1 addition & 1 deletion src/main/python/gephi.py
Expand Up @@ -44,7 +44,7 @@
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xsi:schemaLocation="http://www.gexf.net/1.2draft http://www.gexf.net/1.2draft/gexf.xsd"
version="1.2">
<meta lastmodifieddate="20111012">
<meta lastmodifieddate="2011-10-12">
<creator>Cloudera</creator>
<description>A network of drug-drug relationships</description>
</meta>
Expand Down

0 comments on commit e94d18d

Please sign in to comment.