Class SparkRowSource

  • All Implemented Interfaces:
    java.lang.AutoCloseable, java.util.Iterator<org.gorpipe.gor.model.Row>

    public class SparkRowSource
    extends gorsat.process.ProcessSource
    Created by sigmar on 12/02/16.
    • Nested Class Summary

      • Nested classes/interfaces inherited from class org.gorpipe.gor.model.GenomicIterator

        org.gorpipe.gor.model.GenomicIterator.ChromoLookup
    • Constructor Summary

      Constructors 
      Constructor Description
      SparkRowSource(java.lang.String[] cmds, java.lang.String type, boolean nor, org.gorpipe.gor.session.GorSession gpSession, java.lang.String chr, int pos, int end, int bs)
      SparkRowSource(java.lang.String sql, java.lang.String profile, java.lang.String parquet, java.lang.String type, boolean nor, org.gorpipe.spark.GorSparkSession gpSession, java.lang.String filter, java.lang.String filterFile, java.lang.String filterColumn, java.lang.String splitFile, java.lang.String chr, int pos, int end, boolean usestreaming, java.lang.String jobId, boolean useCpp, java.lang.String parts, int buckets, boolean tag)
    • Method Summary

      All Methods | Static Methods | Instance Methods | Concrete Methods
      Modifier and Type Method Description
      static org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> analyse(org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset, java.lang.String gor)
      java.lang.String checkNested(java.lang.String cmd, org.gorpipe.gor.session.GorSession gpSession, java.lang.String[] errorStr)
      static boolean checkNor(org.apache.spark.sql.types.StructField[] fields)
      org.apache.spark.sql.Dataset<? extends org.gorpipe.gor.model.Row> checkRowFormat(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset)
      void close()
      org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> getDataset()
      java.lang.String getHeader()
      void gor()
      void gorpipe(gorsat.Commands.Analysis pipeStep, boolean gor)
      static org.apache.spark.sql.Dataset<org.gorpipe.gor.model.Row> gorpipe(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset, java.lang.String gor)
      boolean hasNext()
      void init()
      boolean isBuffered()
      boolean isNor()
      static void main(java.lang.String[] args)
      org.gorpipe.gor.model.Row next()
      boolean pushdownCalc(java.lang.String formula, java.lang.String colName)
      boolean pushdownCmd(java.lang.String cmd)
      boolean pushdownFilter(java.lang.String gorwhere)
      boolean pushdownGor(java.lang.String gor)
      boolean pushdownSelect(java.lang.String[] cols)
      boolean pushdownTop(int limit)
      boolean pushdownWrite(java.lang.String filename)
      static org.apache.spark.sql.types.StructType schemaFromRow(java.lang.String[] header, org.gorpipe.gor.model.Row row)
      void setPosition(java.lang.String seekChr, int seekPos)
      java.io.InputStream setRange(java.lang.String seekChr, int startPos, int endPos)
      • Methods inherited from class org.gorpipe.model.gor.iterators.RowSource

        bufferSize, bufferSize_$eq, getAvgBasesPerMilliSecond, getAvgBatchSize, getAvgRowsPerMilliSecond, getAvgSeekTimeMilliSecond, getBufferSize, getCurrentBatchLoc, getCurrentBatchRow, getCurrentBatchSize, getGorHeader, getParent, moveToPosition, moveToPosition$default$3, next, parent, parent_$eq, seek, setBufferSize, setParent, terminateReading
      • Methods inherited from class org.gorpipe.gor.model.GenomicIterator

        clone, decStat, filter, getColnum, getContext, getEx, getLookup, getMonitor, getSourceName, incStat, init, initStats, isSourceAlreadyInserted, seek, select, selectHeader, setColnum, setContext, setEx, setHeader, setSourceAlreadyInserted, setSourceName
      • Methods inherited from class java.lang.Object

        equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
      • Methods inherited from interface java.util.Iterator

        forEachRemaining, remove
    • Constructor Detail

      • SparkRowSource

        public SparkRowSource(java.lang.String sql,
                              java.lang.String profile,
                              java.lang.String parquet,
                              java.lang.String type,
                              boolean nor,
                              org.gorpipe.spark.GorSparkSession gpSession,
                              java.lang.String filter,
                              java.lang.String filterFile,
                              java.lang.String filterColumn,
                              java.lang.String splitFile,
                              java.lang.String chr,
                              int pos,
                              int end,
                              boolean usestreaming,
                              java.lang.String jobId,
                              boolean useCpp,
                              java.lang.String parts,
                              int buckets,
                              boolean tag)
                       throws java.io.IOException,
                              java.util.zip.DataFormatException
        Throws:
        java.io.IOException
        java.util.zip.DataFormatException
      • SparkRowSource

        public SparkRowSource(java.lang.String[] cmds,
                              java.lang.String type,
                              boolean nor,
                              org.gorpipe.gor.session.GorSession gpSession,
                              java.lang.String chr,
                              int pos,
                              int end,
                              int bs)
    • Method Detail

      • init

        public void init()
      • isNor

        public boolean isNor()
      • getDataset

        public org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> getDataset()
      • gorpipe

        public void gorpipe(gorsat.Commands.Analysis pipeStep,
                            boolean gor)
      • gorpipe

        public static org.apache.spark.sql.Dataset<org.gorpipe.gor.model.Row> gorpipe(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset,
                                                                                      java.lang.String gor)
      • gor

        public void gor()
      • schemaFromRow

        public static org.apache.spark.sql.types.StructType schemaFromRow(java.lang.String[] header,
                                                                          org.gorpipe.gor.model.Row row)
      • checkNested

        public java.lang.String checkNested(java.lang.String cmd,
                                            org.gorpipe.gor.session.GorSession gpSession,
                                            java.lang.String[] errorStr)
      • checkNor

        public static boolean checkNor(org.apache.spark.sql.types.StructField[] fields)
      • hasNext

        public boolean hasNext()
        Specified by:
        hasNext in interface java.util.Iterator<org.gorpipe.gor.model.Row>
        Overrides:
        hasNext in class org.gorpipe.gor.model.GenomicIterator
      • next

        public org.gorpipe.gor.model.Row next()
        Specified by:
        next in interface java.util.Iterator<org.gorpipe.gor.model.Row>
        Overrides:
        next in class org.gorpipe.gor.model.GenomicIterator
      • setPosition

        public void setPosition(java.lang.String seekChr,
                                int seekPos)
        Specified by:
        setPosition in class org.gorpipe.model.gor.iterators.RowSource
      • close

        public void close()
        Specified by:
        close in interface java.lang.AutoCloseable
        Specified by:
        close in class org.gorpipe.model.gor.iterators.RowSource
      • setRange

        public java.io.InputStream setRange(java.lang.String seekChr,
                                            int startPos,
                                            int endPos)
        Specified by:
        setRange in class gorsat.process.ProcessSource
      • getHeader

        public java.lang.String getHeader()
        Overrides:
        getHeader in class org.gorpipe.gor.model.GenomicIterator
      • isBuffered

        public boolean isBuffered()
        Overrides:
        isBuffered in class org.gorpipe.gor.model.GenomicIterator
      • checkRowFormat

        public org.apache.spark.sql.Dataset<? extends org.gorpipe.gor.model.Row> checkRowFormat(org.apache.spark.sql.Dataset<? extends org.apache.spark.sql.Row> dataset)
      • pushdownFilter

        public boolean pushdownFilter(java.lang.String gorwhere)
        Overrides:
        pushdownFilter in class org.gorpipe.gor.model.GenomicIterator
      • pushdownCalc

        public boolean pushdownCalc(java.lang.String formula,
                                    java.lang.String colName)
        Overrides:
        pushdownCalc in class org.gorpipe.gor.model.GenomicIterator
      • pushdownSelect

        public boolean pushdownSelect(java.lang.String[] cols)
        Overrides:
        pushdownSelect in class org.gorpipe.gor.model.GenomicIterator
      • pushdownWrite

        public boolean pushdownWrite(java.lang.String filename)
        Overrides:
        pushdownWrite in class org.gorpipe.gor.model.GenomicIterator
      • pushdownCmd

        public boolean pushdownCmd(java.lang.String cmd)
        Overrides:
        pushdownCmd in class org.gorpipe.gor.model.GenomicIterator
      • analyse

        public static org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> analyse(org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset,
                                                                                     java.lang.String gor)
      • pushdownGor

        public boolean pushdownGor(java.lang.String gor)
        Overrides:
        pushdownGor in class org.gorpipe.gor.model.GenomicIterator
      • pushdownTop

        public boolean pushdownTop(int limit)
        Overrides:
        pushdownTop in class org.gorpipe.gor.model.GenomicIterator
      • main

        public static void main(java.lang.String[] args)