Advertisement
Not a member of Pastebin yet?
Sign up —
it unlocks many cool features!
- job.name=TestParquet
- job.group=Test
- job.description=this is a test job that pulls from a test source and writes to Parquet
- job.lock.enabled=false
- task.execution.synchronousExecutionModel=false
- source.class=org.apache.gobblin.test.SequentialTestSource
- source.numParallelism=2
- source.inMemFormat=JSON
- fs.uri=file:///
- work.dir=/Users/sdas/gobblin-work/parquetWorkDir
- converter.classes=org.apache.gobblin.converter.parquet.JsonIntermediateToParquetGroupConverter
- extract.table.name=TestData
- extract.namespace=org.apache.gobblin.example
- extract.table.type=APPEND_ONLY
- state.store.enabled=true
- state.store.fs.uri=${fs.uri}
- state.store.dir=${work.dir}/store
- writer.destination.type=HDFS
- writer.output.format=PARQUET
- writer.fs.uri=${fs.uri}
- writer.builder.class=org.apache.gobblin.writer.ParquetDataWriterBuilder
- data.publisher.fs.uri=${fs.uri}
- data.publisher.type=org.apache.gobblin.publisher.BaseDataPublisher
- data.publisher.final.dir=${work.dir}/test_data
- data.publisher.metadata.output.dir=${work.dir}/metadata
Advertisement
Add Comment
Please sign in to add a comment.
Advertisement