Package gorsat.process
Class SparkRowSource
- java.lang.Object
-
- org.gorpipe.gor.model.GenomicIterator
-
- org.gorpipe.model.gor.iterators.RowSource
-
- gorsat.process.ProcessSource
-
- gorsat.process.SparkRowSource
-
- All Implemented Interfaces:
java.lang.AutoCloseable, java.util.Iterator<org.gorpipe.gor.model.Row>
public class SparkRowSource extends gorsat.process.ProcessSource
Created by sigmar on 12/02/16.
-
-
Constructor Summary
Constructors
Constructor Description
SparkRowSource(java.lang.String[] cmds, java.lang.String type, boolean nor, org.gorpipe.gor.session.GorSession gpSession, java.lang.String chr, int pos, int end, int bs)
SparkRowSource(java.lang.String sql, java.lang.String profile, java.lang.String parquet, java.lang.String type, boolean nor, org.gorpipe.spark.GorSparkSession gpSession, java.lang.String filter, java.lang.String filterFile, java.lang.String filterColumn, java.lang.String splitFile, java.lang.String chr, int pos, int end, boolean usestreaming, java.lang.String jobId, boolean useCpp, java.lang.String parts, int buckets, boolean tag)
-
Method Summary
All Methods, Static Methods, Instance Methods, Concrete Methods
Modifier and Type Method Description
static org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> analyse(org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset, java.lang.String gor)
java.lang.String checkNested(java.lang.String cmd, org.gorpipe.gor.session.GorSession gpSession, java.lang.String[] errorStr)
static boolean checkNor(org.apache.spark.sql.types.StructField[] fields)
org.apache.spark.sql.Dataset<? extends org.gorpipe.gor.model.Row> checkRowFormat(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset)
void close()
org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> getDataset()
java.lang.String getHeader()
void gor()
void gorpipe(gorsat.Commands.Analysis pipeStep, boolean gor)
static org.apache.spark.sql.Dataset<org.gorpipe.gor.model.Row> gorpipe(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset, java.lang.String gor)
boolean hasNext()
void init()
boolean isBuffered()
boolean isNor()
static void main(java.lang.String[] args)
org.gorpipe.gor.model.Row next()
boolean pushdownCalc(java.lang.String formula, java.lang.String colName)
boolean pushdownCmd(java.lang.String cmd)
boolean pushdownFilter(java.lang.String gorwhere)
boolean pushdownGor(java.lang.String gor)
boolean pushdownSelect(java.lang.String[] cols)
boolean pushdownTop(int limit)
boolean pushdownWrite(java.lang.String filename)
static org.apache.spark.sql.types.StructType schemaFromRow(java.lang.String[] header, org.gorpipe.gor.model.Row row)
void setPosition(java.lang.String seekChr, int seekPos)
java.io.InputStream setRange(java.lang.String seekChr, int startPos, int endPos)
-
Methods inherited from class org.gorpipe.model.gor.iterators.RowSource
bufferSize, bufferSize_$eq, getAvgBasesPerMilliSecond, getAvgBatchSize, getAvgRowsPerMilliSecond, getAvgSeekTimeMilliSecond, getBufferSize, getCurrentBatchLoc, getCurrentBatchRow, getCurrentBatchSize, getGorHeader, getParent, moveToPosition, moveToPosition$default$3, next, parent, parent_$eq, seek, setBufferSize, setParent, terminateReading
-
Methods inherited from class org.gorpipe.gor.model.GenomicIterator
clone, decStat, filter, getColnum, getContext, getEx, getLookup, getMonitor, getSourceName, incStat, init, initStats, isSourceAlreadyInserted, seek, select, selectHeader, setColnum, setContext, setEx, setHeader, setSourceAlreadyInserted, setSourceName
-
-
-
-
Constructor Detail
-
SparkRowSource
public SparkRowSource(java.lang.String sql, java.lang.String profile, java.lang.String parquet, java.lang.String type, boolean nor, org.gorpipe.spark.GorSparkSession gpSession, java.lang.String filter, java.lang.String filterFile, java.lang.String filterColumn, java.lang.String splitFile, java.lang.String chr, int pos, int end, boolean usestreaming, java.lang.String jobId, boolean useCpp, java.lang.String parts, int buckets, boolean tag) throws java.io.IOException, java.util.zip.DataFormatException
- Throws:
java.io.IOException
java.util.zip.DataFormatException
-
SparkRowSource
public SparkRowSource(java.lang.String[] cmds, java.lang.String type, boolean nor, org.gorpipe.gor.session.GorSession gpSession, java.lang.String chr, int pos, int end, int bs)
-
-
Method Detail
-
init
public void init()
-
isNor
public boolean isNor()
-
getDataset
public org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> getDataset()
-
gorpipe
public void gorpipe(gorsat.Commands.Analysis pipeStep, boolean gor)
-
gorpipe
public static org.apache.spark.sql.Dataset<org.gorpipe.gor.model.Row> gorpipe(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset, java.lang.String gor)
-
gor
public void gor()
-
schemaFromRow
public static org.apache.spark.sql.types.StructType schemaFromRow(java.lang.String[] header, org.gorpipe.gor.model.Row row)
-
checkNested
public java.lang.String checkNested(java.lang.String cmd, org.gorpipe.gor.session.GorSession gpSession, java.lang.String[] errorStr)
-
checkNor
public static boolean checkNor(org.apache.spark.sql.types.StructField[] fields)
-
hasNext
public boolean hasNext()
- Specified by:
hasNext in interface java.util.Iterator<org.gorpipe.gor.model.Row>
- Overrides:
hasNext in class org.gorpipe.gor.model.GenomicIterator
-
next
public org.gorpipe.gor.model.Row next()
- Specified by:
next in interface java.util.Iterator<org.gorpipe.gor.model.Row>
- Overrides:
next in class org.gorpipe.gor.model.GenomicIterator
-
setPosition
public void setPosition(java.lang.String seekChr, int seekPos)
- Specified by:
setPosition in class org.gorpipe.model.gor.iterators.RowSource
-
close
public void close()
- Specified by:
close in interface java.lang.AutoCloseable
- Specified by:
close in class org.gorpipe.model.gor.iterators.RowSource
-
setRange
public java.io.InputStream setRange(java.lang.String seekChr, int startPos, int endPos)
- Specified by:
setRange in class gorsat.process.ProcessSource
-
getHeader
public java.lang.String getHeader()
- Overrides:
getHeader in class org.gorpipe.gor.model.GenomicIterator
-
isBuffered
public boolean isBuffered()
- Overrides:
isBuffered in class org.gorpipe.gor.model.GenomicIterator
-
checkRowFormat
public org.apache.spark.sql.Dataset<? extends org.gorpipe.gor.model.Row> checkRowFormat(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset)
-
pushdownFilter
public boolean pushdownFilter(java.lang.String gorwhere)
- Overrides:
pushdownFilter in class org.gorpipe.gor.model.GenomicIterator
-
pushdownCalc
public boolean pushdownCalc(java.lang.String formula, java.lang.String colName)
- Overrides:
pushdownCalc in class org.gorpipe.gor.model.GenomicIterator
-
pushdownSelect
public boolean pushdownSelect(java.lang.String[] cols)
- Overrides:
pushdownSelect in class org.gorpipe.gor.model.GenomicIterator
-
pushdownWrite
public boolean pushdownWrite(java.lang.String filename)
- Overrides:
pushdownWrite in class org.gorpipe.gor.model.GenomicIterator
-
pushdownCmd
public boolean pushdownCmd(java.lang.String cmd)
- Overrides:
pushdownCmd in class org.gorpipe.gor.model.GenomicIterator
-
analyse
public static org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> analyse(org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset, java.lang.String gor)
-
pushdownGor
public boolean pushdownGor(java.lang.String gor)
- Overrides:
pushdownGor in class org.gorpipe.gor.model.GenomicIterator
-
pushdownTop
public boolean pushdownTop(int limit)
- Overrides:
pushdownTop in class org.gorpipe.gor.model.GenomicIterator
-
main
public static void main(java.lang.String[] args)
-
-