forked from crowbar-archive/barclamp-hadoop
/
crowbar.yml
334 lines (326 loc) · 18.7 KB
/
crowbar.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
# Copyright 2011, Dell, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Author: RobHirschfeld
#
barclamp:
name: hadoop
display: Hadoop
version: 0
requires:
- @crowbar
member:
- apachehadoop
crowbar:
layout: 1
order: 200
run_order: 200
chef_order: 200
nav:
barclamps:
hadoop: index_barclamp_path(:controller=>'hadoop')
help:
hadoop_ug: '"/hadoop_users_guide.pdf", { :link => { :target => "_blank" } }'
locale_additions:
en:
nav:
hadoop_ug: Hadoop
hadoop: Hadoop
barclamp:
hadoop:
edit_deployment:
deployment: Deployment
edit_attributes:
core_attributes: Hadoop Core Attributes
cloudera_enterprise_scm: Cloudera Enterprise Support
fs_checkpoint_dir: Checkpoint Directory
fs_checkpoint_edits_dir: Checkpoint Edits Directory
fs_checkpoint_period: Checkpoint Time Period
fs_checkpoint_size: Checkpoint Size
fs_default_name: File System Default Name
fs_file_impl: File URI Handler Class
fs_ftp_impl: FTP URI Handler Class
fs_har_impl: HAR URI Handler Class
fs_har_impl_disable_cache: Disable Cache
fs_hdfs_impl: HDFS URI Handler Class
fs_hftp_impl: HFTP URI Handler Class
fs_hsftp_impl: HSFTP URI Handler Class
fs_kfs_impl: KFS URI Handler Class
fs_ramfs_impl: RAMFS URI Handler Class
fs_s3_block_size: S3 Block Size
fs_s3_buffer_dir: S3 Buffer Directory
fs_s3_impl: S3 URI Handler Class
fs_s3_maxRetries: S3 Maximum Retty Count
fs_s3_sleepTimeSeconds: S3 Sleep Time
fs_s3n_impl: S3N URI Handler Class
fs_trash_interval: Trash Interval
hadoop_http_filter_initializers: HTTP Filter Initializers
hadoop_logfile_count: Log File Count
hadoop_logfile_size: Log File Size
hadoop_native_lib: Native Library
hadoop_rpc_socket_factory_class_ClientProtocol: RPC Socket Factory Class Client Protocol
hadoop_rpc_socket_factory_class_default: RPC Socket Factory Class Default
hadoop_security_authentication: Security Authentication
hadoop_security_authorization: Security Authorization
hadoop_security_group_mapping: Security Group Mapping
hadoop_security_uid_cache_secs: Security UID Cache Seconds
hadoop_socks_server: Socks Server
hadoop_tmp_dir: Temporary Directory
hadoop_util_hash_type: Utility Hash Type
io_bytes_per_checksum: Bytes Per Checksum
io_compression_codecs: Compression Codecs
io_file_buffer_size: File Buffer Size
io_mapfile_bloom_error_rate: Mapfile Bloom Error Rate
io_mapfile_bloom_size: Mapfile Bloom Size
io_seqfile_compress_blocksize: Sequential File Compress Block Size
io_seqfile_lazydecompress: Sequential File Lazy Decompress
io_seqfile_sorter_recordlimit: Sequential File Sorter Record Limit
io_serializations: Serializations
io_skip_checksum_errors: Skip Checksum Errors
ipc_client_connect_max_retries: IPC Client Connect Maximum Retries
ipc_client_connection_maxidletime: IPC Client Connection Maximum Idle Time
ipc_client_idlethreshold: IPC Client Idle Threshold
ipc_client_kill_max: IPC Client Kill Maximum
ipc_client_tcpnodelay: IPC Client TCP No Delay
ipc_server_listen_queue_size: IPC Server Listen Queue Size
ipc_server_tcpnodelay: IPC Server TCP No Delay
local_cache_size: Local Cache Size
topology_node_switch_mapping_impl: Topology Node Switch Mapping Class
topology_script_file_name: Topology Script File Name
topology_script_number_args: Topology Script Number Arguments
webinterface_private_actions: Web Interface Private Actions
env_attributes: Hadoop Environment Attributes
hadoop_datanode_opts: Hadoop Datanode Options
hadoop_heapsize: Hadoop Heapsize
hadoop_jobtracker_opts: Hadoop Jobtracker Options
hadoop_log_dir: Hadoop Log Directory
hadoop_namenode_opts: Hadoop Namenode Options
hadoop_secondarynamenode_opts: Hadoop Secondary Namenode Options
hadoop_tasktracker_opts: Hadoop Tasktracker Options
hdfs_attributes: Hadoop HDFS Attributes
dfs_access_time_precision: DFS Access Time Precision
dfs_balance_bandwidthPerSec: DFS Balance Bandwidth Per Second
dfs_block_access_key_update_interval: DFS Block Access Key Update Interval
dfs_block_access_token_enable: DFS Block Access Token Enable
dfs_block_access_token_lifetime: DFS Block Access Token Life Time
dfs_block_size: DFS Block Size
dfs_blockreport_initialDelay: DFS Block Report Initial Delay
dfs_blockreport_intervalMsec: DFS Block Report Interval
dfs_client_block_write_retries: DFS Client Block Write Retries
dfs_data_dir: DFS Data Directoryt
dfs_datanode_address: DFS Datanode Address
dfs_datanode_data_dir_perm: DFS Datanode Data Directory Permissions
dfs_datanode_dns_interface: DFS Datanode DNS Interface
dfs_datanode_dns_nameserver: DFS Datanode DNS Name Server
dfs_datanode_du_reserved: DFS Datanode Disk Units Reserved
dfs_datanode_failed_volumes_tolerated: DFS Datanode Failed Volumes Tolerated
dfs_datanode_handler_count: DFS Datanode Handler Count
dfs_datanode_http_address: DFS Datanode HTTP Address
dfs_datanode_https_address: DFS Datanode HTTPS Address
dfs_datanode_ipc_address: DFS Datanode IPC Address
dfs_default_chunk_view_size: DFS Default Chunck View Size
dfs_df_interval: DFS DF Interval
dfs_heartbeat_interval: DFS Heartbeat Interval
dfs_hosts: DFS Hosts
dfs_hosts_exclude: DFS Hosts Exclusion
dfs_http_address: DFS HTTP Address
dfs_https_address: DFS HTTPS Address
dfs_https_client_keystore_resource: DFS HTTPS Client Keystore Resource
dfs_https_enable: DFS HTTPS Enable
dfs_https_need_client_auth: DFS HTTPS Need Client Authorization
dfs_https_server_keystore_resource: DFS HTTPS Server Keystore Resource
dfs_max_objects: DFS Maximum Objects
dfs_name_dir: DFS Name Directory
dfs_name_edits_dir: DFS Name Edits Directory
dfs_namenode_decommission_interval: DFS Namenode Decommission Interval
dfs_namenode_decommission_nodes_per_interval: DFS Namenode Decommission Nodes Per Interval
dfs_namenode_delegation_key_update_interval: DFS Namenode Delegation Key Update Interval
dfs_namenode_delegation_token_max_lifetime: DFS Namenode Delegation Token Maximum Lifetime
dfs_namenode_delegation_token_renew_interval: DFS Namenode Delegation Token Renew Interval
dfs_namenode_handler_count: DFS Namenode Handler Count
dfs_namenode_logging_level: DFS Namenode Logging Level
dfs_permissions: DFS Permissions
dfs_permissions_supergroup: DFS Permissions Supergroup
dfs_replication: DFS Replication
dfs_replication_considerLoad: DFS Replication Consider Load
dfs_replication_interval: DFS Replication Interval
dfs_replication_max: DFS Replication Maximum
dfs_replication_min: DFS Replication Minimum
dfs_safemode_extension: DFS Safemode Extension
dfs_safemode_threshold_pct: DFS Safemode Threshold PCT
dfs_secondary_http_address: DFS Secondary HTTP Address
dfs_support_append: DFS Support Append
dfs_web_ugi: DFS Web UGI
mapred_attributes: Hadoop Map Reduce Attributes
attributes: Attributes
hadoop_job_history_location: Hadoop Job History Location
hadoop_job_history_user_location: Hadoop Job History User Location
hadoop_rpc_socket_factory_class_JobSubmissionProtocol: Hadoop RPC Socket Factory Class
io_map_index_skip: I/O Map Index Skip
io_sort_factor: I/O Sort Factor
io_sort_mb: I/O Sort Memory
io_sort_record_percent: I/O Sort Record Percent
io_sort_spill_percent: I/O Sort Spill Percent
job_end_retry_attempts: Job End Retry Attempts
job_end_retry_interval: Job End Retry Interval
jobclient_output_filter: Job Client Output Filter
keep_failed_task_files: Keep Failed Task Files
map_sort_class: Map Sort Class
mapred_acls_enabled: Map/Reduce ACLS Enabled
mapred_child_env: Map/Reduce Child Environment
mapred_child_java_opts: Map/Reduce Child Java Options
mapred_child_tmp: Map/Reduce Child Temporary Directory
mapred_child_ulimit: Map/Reduce Child Ulimit
mapred_cluster_map_memory_mb: Map/Reduce Cluster Map Memory
mapred_cluster_max_map_memory_mb: Map/Reduce Cluster Maximum Map Memory
mapred_cluster_max_reduce_memory_mb: Map/Reduce Cluster Maximum Reduce Memory
mapred_cluster_reduce_memory_mb: Map/Reduce Cluster Reduce Memory
mapred_compress_map_output: Map/Reduce Compress Map Output
mapred_healthChecker_interval: Map/Reduce Health Checker Interval
mapred_healthChecker_script_args: Map/Reduce Health Checker Script Arguments
mapred_healthChecker_script_path: Map/Reduce Health Checker Script Path
mapred_healthChecker_script_timeout: Map/Reduce Health Checker Script Timeout
mapred_heartbeats_in_second: Map/Reduce Heartbeats
mapred_hosts: Map/Reduce Hosts
mapred_hosts_exclude: Map/Reduce Hosts Exclusions
mapred_inmem_merge_threshold: Map/Reduce In memory Merge Threshold
mapred_job_map_memory_mb: Map/Reduce Job Map Memory
mapred_job_queue_name: Map/Reduce Job Queue Name
mapred_job_reduce_input_buffer_percent: Map/Reduce Job Reduce Input Buffer
mapred_job_reduce_memory_mb: Map/Reduce Job Reduce Memory
mapred_job_reuse_jvm_num_tasks: Map/Reduce Job Reuse JVM Number of Tasks
mapred_job_shuffle_input_buffer_percent: Map/Reduce Job Shuffle Input Buffer
mapred_job_shuffle_merge_percent: Map/Reduce Job Shuffle Merge Percent
mapred_job_tracker: Map/Reduce Job Tracker
mapred_job_tracker_handler_count: Map/Reduce Job Tracker Handler Count
mapred_job_tracker_history_completed_location: Map/Reduce Job Tracker History Completed Location
mapred_job_tracker_http_address: Map/Reduce Job Tracker HTTP Address
mapred_job_tracker_jobhistory_lru_cache_size: Map/Reduce Job Tracker Job History LRU Cache Size
mapred_job_tracker_persist_jobstatus_active: Map/Reduce Job Tracker Persist Job Status Active
mapred_job_tracker_persist_jobstatus_dir: Map/Reduce Job Tracker Persist Job Status Directory
mapred_job_tracker_persist_jobstatus_hours: Map/Reduce Job Tracker Persist Job Status Hours
mapred_job_tracker_retiredjobs_cache_size: Map/Reduce Job Tracker Retired Jobs Cache Size
mapred_jobtracker_blacklist_fault_bucket_width: Map/Reduce Job Tracker Blacklist Fault Bucket Width
mapred_jobtracker_blacklist_fault_timeout_window: Map/Reduce Job Tracker Blacklist Fault Timeout Window
mapred_jobtracker_completeuserjobs_maximum: Map/Reduce Job Tracker Complete User Jobs Maximum
mapred_jobtracker_job_history_block_size: Map/Reduce Job Tracker Job History Block Size
mapred_jobtracker_maxtasks_per_job: Map/Reduce Job Tracker Maximum Tasks Per Job
mapred_jobtracker_restart_recover: Map/Reduce Job Tracker Restart Recover
mapred_jobtracker_taskScheduler: Map/Reduce Job Tracker Task Scheduler
mapred_jobtracker_taskScheduler_maxRunningTasksPerJob: Map/Reduce Job Task Scheduler Maximu Tasks Per Job
mapred_line_input_format_linespermap: Map/Reduce Line Input Lines Per Map
mapred_local_dir: Map/Reduce Local Directory
mapred_local_dir_minspacekill: Map/Reduce Minimum Space Kill
mapred_local_dir_minspacestart: Map/Reduce Minimum Space Start
mapred_map_max_attempts: Map/Reduce Maximum Map Attempts
mapred_map_output_compression_codec: Map/Reduce Map Output Compression Codec
mapred_map_tasks: Map/Reduce Map Tasks
mapred_map_tasks_speculative_execution: Map/Reduce Map Tasks Speculative Execution
mapred_max_tracker_blacklists: Map/Reduce Maximum Tracker Blacklists
mapred_max_tracker_failures: Map/Reduce Maximum Tracker Failures
mapred_merge_recordsBeforeProgress: Map/Reduce Merge Records Before Progress
mapred_min_split_size: Map/Reduce Minimum Split Size
mapred_output_compress: Map/Reduce Output Compress
mapred_output_compression_codec: Map/Reduce Output Compression Codec
mapred_output_compression_type: Map/Reduce Output Compression Type
mapred_queue_default_state: Map/Reduce Queue Default State
mapred_queue_names: Map/Reduce Queue Names
mapred_reduce_copy_backoff: Map/Reduce Copy Backoff
mapred_reduce_max_attempts: Map/Reduce Maximum Attempts
mapred_reduce_parallel_copies: Map/Reduce Reduce Parallel Copies
mapred_reduce_slowstart_completed_maps: Map/Reduce Reduce Slow Start Completed Maps
mapred_reduce_tasks: Map/Reduce Tasks
mapred_reduce_tasks_speculative_execution: Map/Reduce Tasks Speculative Execution
mapred_skip_attempts_to_start_skipping: Map/Reduce Skip Attempts To Start Skipping
mapred_skip_map_auto_incr_proc_count: Map/Reduce Skip Map Auto Increment Proc Count
mapred_skip_map_max_skip_records: Map/Reduce Skip Map Maximum Skip Records
mapred_skip_out_dir: Map/Reduce Skip Output Directory
mapred_skip_reduce_auto_incr_proc_count: Map/Reduce Skip Reduce Auto Increment Proc Count
mapred_skip_reduce_max_skip_groups: Map/Reduce Skip Reduce Maximum Skip Groups
mapred_submit_replication: Map/Reduce Submit Replication
mapred_system_dir: Map/Reduce System Directory
mapred_task_cache_levels: Map/Reduce Task Cache Levels
mapred_task_profile: Map/Reduce Task Profile
mapred_task_profile_maps: Map/Reduce Task Profile Maps
mapred_task_profile_reduces: Map/Reduce Task Profile Reduces
mapred_task_timeout: Map/Reduce Task Timeout
mapred_task_tracker_http_address: Map/Reduce Task Tracker HTTP Address
mapred_task_tracker_report_address: Map/Reduce Task Tracker Report Address
mapred_task_tracker_task_controller: Map/Reduce Task Tracker Task Controller
mapred_tasktracker_dns_interface: Map/Reduce Task Tracker DNS Interface
mapred_tasktracker_dns_nameserver: Map/Reduce Task Tracker DNS Name Server
mapred_tasktracker_expiry_interval: Map/Reduce Task Tracker Expiry Interval
mapred_tasktracker_indexcache_mb: Map/Reduce Task Tracker Index Cache Size
mapred_tasktracker_map_tasks_maximum: Map/Reduce Task Tracker Map Tasks Maximum
mapred_tasktracker_memory_calculator_plugin: Map/Reduce Task Tracker Memory Calculator Plugin
mapred_tasktracker_reduce_tasks_maximum: Map/Reduce Task Tracker Reduce Tasks Maximum
mapred_tasktracker_taskmemorymanager_monitoring_interval: Map/Reduce Task Tracker Memory Manager Monitoring Interval
mapred_tasktracker_tasks_sleeptime_before_sigkill: Map/Reduce Task Tracker Tasks Sleep Time Before Sigkill
mapred_temp_dir: Map/Reduce Temporary Directory
mapred_user_jobconf_limit: Map/Reduce User Job Conf Limit
mapred_userlog_limit_kb: Map/Reduce User Log Limit
mapred_userlog_retain_hours: Map/Reduce User Log Retain Hours
mapreduce_job_acl_modify_job: Map/Reduce Job ACL Modify Job
mapreduce_job_acl_view_job: Map/Reduce Job ACL View Job
mapreduce_job_complete_cancel_delegation_tokens: Map/Reduce Job Complete Cancel Delegation Tokens
mapreduce_job_counters_limit: Map/Reduce Job Counters Limit
mapreduce_job_split_metainfo_maxsize: Map/Reduce Job Split Metainfo Maximum Size
mapreduce_jobtracker_staging_root_dir: Map/Reduce Jobtracker Staging Root Dir
mapreduce_reduce_input_limit: Map/Reduce Reduce Input Limit
mapreduce_reduce_shuffle_connect_timeout: Map/Reduce Reduce Shuffle Connect Timeout
mapreduce_reduce_shuffle_read_timeout: Map/Reduce Reduce Shuffle Read Timeout
mapreduce_tasktracker_group: Map/Reduce Task Tracker Group
mapreduce_tasktracker_outofband_heartbeat: Map/Reduce Task Tracker Out Of Band Heartbeat
tasktracker_http_threads: Map/Reduce Task Tracker HTTP Threads
scheduler_attributes: Hadoop Scheduler Attributes
default_min_share_preemption_timeout: Default Minimum Share Preemption Timeout
default_pool_scheduling_mode: Default Pool Scheduling Mode
fair_share_preemption_timeout: Fair Share Preemption Timeout
pool_max_jobs_default: Pool Maximum Jobs Default
user_max_jobs_default: User Maximum Jobs Default
index:
barclamp: Project
state: Status
proposal: Proposal
description: Description
instructions: Apply proposals in order from top to bottom. Allow each proposal to enter ready state before applying the next one.
rpms:
redhat-5.7:
repos:
- bare cloudera-cdh3 10 http://archive.cloudera.com/redhat/cdh/3/
centos-5.7:
repos:
- bare cloudera-cdh3 10 http://archive.cloudera.com/redhat/cdh/3/
redhat-6.2:
repos:
- bare cloudera-cdh3 10 http://archive.cloudera.com/redhat/6/x86_64/cdh/3
centos-6.2:
repos:
- bare cloudera-cdh3 10 http://archive.cloudera.com/redhat/6/x86_64/cdh/3
pkgs:
# JDK dependency will be magically satisfied by the Java package below.
# - jdk
- hadoop-0.20
- hadoop-0.20-namenode
- hadoop-0.20-jobtracker
- hadoop-0.20-secondarynamenode
- hadoop-0.20-datanode
- hadoop-0.20-tasktracker
- hadoop-0.20-sbin
- hadoop-0.20-native
extra_files:
- http://download.oracle.com/otn-pub/java/jdk/6u27-b07/jdk-6u27-linux-x64-rpm.bin java
build_cmd: build-jdk.sh
smoketest:
timeout: 900