Versions Compared

Key

  • This line was added.
  • This line was removed.
  • Formatting was changed.

...

job.name=CSVToAvroQuickStart

 

fs.uri=hdfs://localhost:9000

 

converter.classes=org.apache.gobblin.converter.csv.CsvToJsonConverter,org.apache.gobblin.converter.avro.JsonIntermediateToAvroConverter

writer.builder.class=org.apache.gobblin.writer.AvroDataWriterBuilder


source.class=org.apache.gobblin.source.extractor.filebased.TextFileBasedSource

source.filebased.data.directory=${fs.uri}/source

source.schema=[{"columnName":"ID","comment":"","isNullable":"true","dataType":{"type":"String"}},{"columnName":"NAME","comment":"","isNullable":"true","dataType":{"type":"String"}}]

source.skip.first.record=false

 

extract.table.name=CsvToAvro

extract.namespace=org.apache.gobblin.example

extract.table.type=APPEND_ONLY

 

converter.csv.to.json.delimiter=","

 

writer.output.format=AVRO

writer.destination.type=HDFS

writer.fs.uri=${fs.uri}

writer.staging.dir=/writer-staging

writer.output.dir=/output

 

state.store.dir=/state

state.store.fs.uri=${fs.uri}

state.store.dir=/gobblin-kafka/state-store

data.publisher.final.dir=/final

 

  • Run gobblin-standalone.sh
    • bin/gobblin-standalone.sh start --conf ~/gobblin/conf/ex.pull