forked from D-Net/dnet-hadoop
[orcid] download of the lambda file defined in a script
This commit is contained in:
parent
55964cbd81
commit
e5abbec2ba
|
@ -0,0 +1,3 @@
|
|||
wget -O /tmp/last_modified.csv.tar http://74804fb637bd8e2fba5b-e0a029c2f87486cddec3b416996a6057.r3.cf1.rackcdn.com/last_modified.csv.tar
|
||||
hdfs dfs -copyFromLocal /tmp/last_modified.csv.tar /data/orcid_activities_2020/last_modified.csv.tar
|
||||
rm -f /tmp/last_modified.csv.tar
|
|
@ -24,12 +24,6 @@
|
|||
<name>token</name>
|
||||
<description>access token</description>
|
||||
</property>
|
||||
<property>
|
||||
<name>shell_cmd</name>
|
||||
<value>wget -O /tmp/last_modified.csv.tar http://74804fb637bd8e2fba5b-e0a029c2f87486cddec3b416996a6057.r3.cf1.rackcdn.com/last_modified.csv.tar ; hdfs dfs -copyFromLocal /tmp/last_modified.csv.tar /data/orcid_activities_2020/last_modified.csv.tar ; rm -f /tmp/last_modified.csv.tar
|
||||
</value>
|
||||
<description>the shell command that downloads the lambda file from orcid containing last orcid update information</description>
|
||||
</property>
|
||||
<property>
|
||||
<name>sparkDriverMemory</name>
|
||||
<value>7G</value>
|
||||
|
@ -103,9 +97,8 @@
|
|||
<shell xmlns="uri:oozie:shell-action:0.1">
|
||||
<job-tracker>${jobTracker}</job-tracker>
|
||||
<name-node>${nameNode}</name-node>
|
||||
<exec>bash</exec>
|
||||
<argument>-c</argument>
|
||||
<argument>${shell_cmd}</argument>
|
||||
<exec>get_orcid_lambda_file.sh</exec>
|
||||
<file>get_orcid_lambda_file.sh</file>
|
||||
<capture-output/>
|
||||
</shell>
|
||||
<ok to="GenLastModifiedSeq"/>
|
||||
|
|
Loading…
Reference in New Issue