CoreDseGraphFrame

Instance Constructors

new CoreDseGraphFrame(graphFrame: GraphFrame, graphKeyspace: GraphKeyspace, name: Option[String] = None, graphOptions: Map[String, String] = Map.empty)

Value Members

final def !=(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def E(edgesIds: AnyRef*): DseGraphTraversal[Edge]

Return graph traversal that supports a subset of TinkerPop3 traversal steps
Return graph traversal that supports a subset of TinkerPop3 traversal steps
edgesIds
edge ids to start the traversal with
returns
GraphTraversal[Edge] for the filtered graph

Definition Classes
DseGraphFrame
Annotations
@varargs()
def E: DseGraphTraversal[Edge]

Return graph traversal that supports a subset of TinkerPop3 traversal steps
Return graph traversal that supports a subset of TinkerPop3 traversal steps
returns
GraphTraversal[Edge] for the graph

Definition Classes
DseGraphFrame
def V(vertexIds: AnyRef*): DseGraphTraversal[Vertex]

Return graph traversal that supports a subset of TinkerPop3 traversal steps
Return graph traversal that supports a subset of TinkerPop3 traversal steps
vertexIds
vertex ids to start the traversal with
returns
GraphTraversal[Vertex] for the filtered graph

Definition Classes
DseGraphFrame
Annotations
@varargs()
def V: DseGraphTraversal[Vertex]

Return graph traversal that supports a subset of TinkerPop3 traversal steps
Return graph traversal that supports a subset of TinkerPop3 traversal steps
returns
GraphTraversal[Vertex] for the graph

Definition Classes
DseGraphFrame
final def asInstanceOf[T0]: T0

Definition Classes
Any
def cache(): CoreDseGraphFrame.this.type

proxy call to gf.cache()
proxy call to gf.cache()
returns
this

Definition Classes
DseGraphFrame
def cleanUp: String

Remove any invalid edge entries from the database backend.
Remove any invalid edge entries from the database backend.

Definition Classes
DseGraphFrame
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
val clusterName: String

Attributes
protected
Definition Classes
DseGraphFrame
lazy val connector: CassandraConnector

Attributes
protected
Definition Classes
DseGraphFrame
val connectorOptions: Map[String, String]

Attributes
protected
Definition Classes
DseGraphFrame
def deleteEdgeProperties(df: DataFrame, properties: String*): Unit

clean edge properties
clean edge properties
properties
delete only the selected properties, not the entire row

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def deleteEdgeProperties(df: DataFrame, properties: Array[String]): Unit
def deleteEdges(df: DataFrame, cache: Boolean = true): Unit

delete graph edges.
delete graph edges. 4 id columns should be passed to the method
```
+--------------------+--------------------+-------+--------------------+
|                 src|                 dst| ~label|                  id|
+--------------------+--------------------+-------+--------------------+
|god:THxdAAAAAAAAAAAA|titan:J474AAAAAAA...| father|da0a9900-8fe1-11e...|
+--------------------+--------------------+-------+--------------------+
```
df
data frame with edge ids: src,dst,~label, id
cache
cache df before processing, true by default for consistent updates. Two C* entries need to be deleted for one edge, so no reloads are expected between these two calls.

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def deleteEdges(df: DataFrame): Unit

shortcut for deleteEdges(df: DataFrame, cache: Boolean = true) for Java
shortcut for deleteEdges(df: DataFrame, cache: Boolean = true) for Java

Definition Classes
DseGraphFrame
def deleteVertexProperties(df: DataFrame, properties: Seq[String], labels: Seq[String] = Seq.empty, cache: Boolean = true): Unit

clean vertex properties with meta properties
clean vertex properties with meta properties
properties
property names to delete

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def deleteVertexProperties(df: DataFrame, properties: String*): Unit

clean vertex properties with meta properties
clean vertex properties with meta properties
properties
property names to delete

Definition Classes
DseGraphFrame
Annotations
@varargs()
def deleteVertices(label: String): Unit

delete all vertices with given label
delete all vertices with given label

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def deleteVertices(df: DataFrame, labels: Seq[String] = Seq.empty, cache: Boolean = true): Unit

df
should contain the "id" column of the vertices to delete
labels
(optional) speed up deletion by providing list of affected labels
cache
true by default. the df will be cached before processing.

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def dropIsolatedVertices(): DseGraphFrame

proxy call to gf.dropIsolatedVertices()
proxy call to gf.dropIsolatedVertices()
returns
new filtered DseGraphFrame

Definition Classes
DseGraphFrame
var dseGraphName: Option[String]

Attributes
protected
Definition Classes
DseGraphFrame
lazy val edgeIdColumnNames: Seq[String]

Definition Classes
CoreDseGraphFrame → DseGraphFrame
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def filterEdges(conditionExpr: String): DseGraphFrame

proxy call to gf.filterEdges()
proxy call to gf.filterEdges()
returns
new filtered DseGraphFrame

Definition Classes
DseGraphFrame
def filterEdges(condition: Column): DseGraphFrame

proxy call to gf.filterEdges()
proxy call to gf.filterEdges()
returns
new filtered DseGraphFrame

Definition Classes
DseGraphFrame
def filterVertices(conditionExpr: String): DseGraphFrame

proxy call to gf.filterVertices()
proxy call to gf.filterVertices()
returns
new filtered DseGraphFrame

Definition Classes
DseGraphFrame
def filterVertices(condition: Column): DseGraphFrame

proxy call to gf.filterVertices()
proxy call to gf.filterVertices()
returns
new filtered DseGraphFrame

Definition Classes
DseGraphFrame
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def getEdgeLabelFromSchema(outVertexLabel: String, edgeLabel: String, inVertexLabel: String): EdgeLabel
val gf: GraphFrame

Definition Classes
DseGraphFrame
val graphKeyspace: GraphKeyspace
def graphName: String

Returns the graph name of this DseGraphFrame.
Returns the graph name of this DseGraphFrame.

Definition Classes
DseGraphFrame
Exceptions thrown
NoSuchElementException if the graph name is not set.
val graphOptions: Map[String, String]

Definition Classes
DseGraphFrame
def hashCode(): Int

Definition Classes
AnyRef → Any
def idColumn(labelColumn: Column, idColumns: Column*): Column

Utility method to generate GraphFrame compatible ids, if a mixed set of labels is in the DF.
Utility method to generate GraphFrame compatible ids, if a mixed set of labels is in the DF. It is slower than idColumn(label: String, idColumns: Column*): Column. The id is added automatically when a vertex is inserted, if the inserted columns have the same names as in the graph schema. This is not possible for edges, as you need to specify both the src and dst ids. Usage:
```
val updateEdgeDF = sourceDF.select(
  gf.idColumn(col("srcLabel"), col("srcId")) as "src",
  gf.idColumn(col("dstLabel"), col("dstId")) as "dst",
  col("label") as "~label",
  gf.randomEdgeIdColumn,
  col("property"))

gf.updateEdges(updateEdgeDF)
```
If different labels have different id formats, use a case statement to select the right id column for each label:
```
when(col("srcLabel") === "1format", col("src1Id")).when(col("srcLabel") === "2format", col("src2Id")).otherwise(col("src3Id")) as "src"
```
Definition Classes
CoreDseGraphFrame → DseGraphFrame
Annotations
@varargs()
def idColumn(label: String, idColumns: Column*): Column

Utility method to generate GraphFrame compatible ids.
Utility method to generate GraphFrame compatible ids. The id is added automatically when a vertex is inserted, if the inserted columns have the same names as in the graph schema. This is not possible for edges, as you need to specify both the src and dst ids. Usage:
```
val updateEdgeDF = sourceDF.select(
  gf.idColumn("srcLabel", col("srcId")) as "src",
  gf.idColumn("dstLabel", col("dstId")) as "dst",
  col("label") as "~label",
  gf.randomEdgeIdColumn,
  col("property"))

gf.updateEdges(updateEdgeDF)
```
Definition Classes
CoreDseGraphFrame → DseGraphFrame
Annotations
@varargs()
def io(url: String): DseGraphTraversal[Vertex]

Performs a read or write based operation on the Graph backing this GraphTraversalSource.
Performs a read or write based operation on the Graph backing this GraphTraversalSource. This step can be accompanied by the GraphTraversal#with(String, Object) modulator for further configuration and must be accompanied by a GraphTraversal#read() or GraphTraversal#write() modulator step which will terminate the traversal.
url
the URL of a file in a distributed file system, a JDBC connection, or the name of a file in the default file system to which the read or write will apply - note that the context of how this parameter is used is wholly dependent on the implementation, e.g. the Cassandra reader/writer implementation will ignore this path and read the table name from parameters.
returns
the traversal with the IoStep added

Definition Classes
DseGraphFrame
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def persist(storageLevel: StorageLevel): CoreDseGraphFrame.this.type

proxy call to gf.persist()
proxy call to gf.persist()
returns
this

Definition Classes
DseGraphFrame
def persist(): CoreDseGraphFrame.this.type

proxy call to gf.persist()
proxy call to gf.persist()
returns
this

Definition Classes
DseGraphFrame
lazy val spark: SparkSession

Attributes
protected
Definition Classes
DseGraphFrame
lazy val sqlContext: SQLContext

Attributes
protected
Definition Classes
DseGraphFrame
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toExternalEdgeId(label: String, srcId: String, dstId: String, ids: Seq[Any], schema: StructType): AnyRef

label
Edge label
srcId
Source vertex id
dstId
Destination vertex id
ids
Edge ids
schema
Associated DataFrame schema
returns
External ID object

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def toExternalVertexId(id: String): AnyRef

id
String of vertex ID in the form "label:columnData:checkSum(data)"
returns
External ID object

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def toString(): String

Definition Classes
AnyRef → Any
def unpersist(blocking: Boolean): CoreDseGraphFrame.this.type

proxy call to gf.unpersist()
proxy call to gf.unpersist()
returns
this

Definition Classes
DseGraphFrame
def unpersist(): CoreDseGraphFrame.this.type

proxy call to gf.unpersist()
proxy call to gf.unpersist()
returns
this

Definition Classes
DseGraphFrame

def updateEdges(outVertexLabel: String, edgeLabel: String, inVertexLabel: String, df: DataFrame): Unit

Update or insert edges.

Update or insert edges. Edge id column names should be the same as in the underlying DSE-DB table.

For example, suppose we have the following edge label definition (Core Graph)

schema.edgeLabel('created')
  .ifNotExists()
  .from('person').to('software')
  .property('weight', Double)
  .create()

with the corresponding CQL table definition

CREATE TABLE test.person__created__software (
  person_name text,
  person_ssn text,
  person_age int,
  software_name text,
  software_version text,
  software_lang text,
  weight double,
  PRIMARY KEY ((person_name, person_ssn), person_age, software_name, software_version, software_lang)
) WITH CLUSTERING ORDER BY (person_age ASC, software_name ASC, software_version ASC, software_lang ASC)

In this example, we have "person" and "software" vertex labels (not shown) that are connected with a "created" edge label.

Edge updates can be carried out like this

scala> g.updateEdges("person", "created", "software", createdDF)

where the dataframe has the following column names, note they match the corresponding DSE-DB edge table column names

scala> createdDF.show
+-----------+-----------+----------+-------------+----------------+-------------+------+
|person_name| person_ssn|person_age|software_name|software_version|software_lang|weight|
+-----------+-----------+----------+-------------+----------------+-------------+------+
|      rocco|111-11-1111|        21|         chat|             1.0|        scala|   2.0|
+-----------+-----------+----------+-------------+----------------+-------------+------+

Note: The dataframe is not cached by this function. The dataframe should be persisted by the user if a dynamic data source is used.

df: data frame with edge ids and update columns

Definition Classes: CoreDseGraphFrame → DseGraphFrame

def updateEdges(df: DataFrame, cache: Boolean = true): Unit

Update the edges of this graph.
Update the edges of this graph. The minimal df schema is: 4 id columns and at least one property to update
```
+--------------------+--------------------+-------+--------------------+-------------------+
|                 src|                 dst| ~label|                  id|               prop|
+--------------------+--------------------+-------+--------------------+-------------------+
|god:THxdAAAAAAAAAAAA|titan:J474AAAAAAA...| father|da0a9900-8fe1-11e...|              value|
+--------------------+--------------------+-------+--------------------+-------------------+
```
If the ID column is not present, it will be generated and the edges will be saved as new.
df
data frame with edge ids and update columns
cache
cache df before processing, true by default for consistent updates. Two C* entries need to be updated for one edge, so no reloads are expected between these two calls.

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def updateEdges(df: DataFrame): Unit

shortcut for updateEdges(df: DataFrame, cache: Boolean = true) for Java
shortcut for updateEdges(df: DataFrame, cache: Boolean = true) for Java

Definition Classes
DseGraphFrame
def updateVertices(vertexLabel: String, df: DataFrame): Unit

Update the vertices of this graph with the properties provided in the df.
Update the vertices of this graph with the properties provided in the df. You should provide the id in non-encoded format
```
+-----------------+---------+---------+
|     community_id|member_id|      age|
+-----------------+---------+---------+
|       1182054400|        0|        0|
+-----------------+---------+---------+
```
the df is not cached by the function.
vertexLabel
to update
df
dataframe with vertex id and update columns

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def updateVertices(df: DataFrame, labels: Seq[String] = Seq.empty, cache: Boolean = true): Unit

Update the vertices of this graph with the properties provided in the df.
Update the vertices of this graph with the properties provided in the df. The minimal df schema is just the vertex "id" and one property to update:
```
+-----------------+---------+
|               id|      age|
+-----------------+---------+
|god:AAAAATMAAA...|        0|
+-----------------+---------+
```
The label and vertex id will be extracted from the graph frame id. For better performance it is recommended to add/leave the "~label" column
```
+-----------------+---------+---------+
|               id|   ~label|      age|
+-----------------+---------+---------+
|god:AAAAATMAAA...|      god|        0|
+-----------------+---------+---------+
```
You can also provide the id in non-encoded format
```
+-----------------+---------+---------+---------+
|     community_id|member_id|   ~label|      age|
+-----------------+---------+---------+---------+
|       1182054400|        0|      god|        0|
+-----------------+---------+---------+---------+
```
Note: passing both synthetic "id" and vertex Id columns is an error.
df
dataframe with vertex id and update columns
labels
empty (meaning all) by default. It is convenient to group vertices with the same id format; that group can be passed here to reduce the number of verification steps
cache
cache df before processing, true by default for consistent updates and performance

Definition Classes
CoreDseGraphFrame → DseGraphFrame
def updateVertices(df: DataFrame): Unit

shortcut for updateVertices(df: DataFrame, labels: Seq[String] = Seq.empty, cache: Boolean = true) for Java API
shortcut for updateVertices(df: DataFrame, labels: Seq[String] = Seq.empty, cache: Boolean = true) for Java API
df
dataframe with vertex id and update columns

Definition Classes
DseGraphFrame
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
def withCachedDf[T](df: DataFrame, cache: Boolean)(code: ⇒ T): T

Attributes
protected
Definition Classes
DseGraphFrame

Related Docs: object CoreDseGraphFrame | package dsedb

class CoreDseGraphFrame extends DseGraphFrame

Instance Constructors

new CoreDseGraphFrame(graphFrame: GraphFrame, graphKeyspace: GraphKeyspace, name: Option[String] = None, graphOptions: Map[String, String] = Map.empty)

Value Members

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: Any): Boolean

def E(edgesIds: AnyRef*): DseGraphTraversal[Edge]

def E: DseGraphTraversal[Edge]

def V(vertexIds: AnyRef*): DseGraphTraversal[Vertex]

def V: DseGraphTraversal[Vertex]

final def asInstanceOf[T0]: T0

def cache(): CoreDseGraphFrame.this.type

def cleanUp: String

def clone(): AnyRef

val clusterName: String

lazy val connector: CassandraConnector

val connectorOptions: Map[String, String]

def deleteEdgeProperties(df: DataFrame, properties: String*): Unit

def deleteEdgeProperties(df: DataFrame, properties: Array[String]): Unit

def deleteEdges(df: DataFrame, cache: Boolean = true): Unit

def deleteEdges(df: DataFrame): Unit

def deleteVertexProperties(df: DataFrame, properties: Seq[String], labels: Seq[String] = Seq.empty, cache: Boolean = true): Unit

def deleteVertexProperties(df: DataFrame, properties: String*): Unit

def deleteVertices(label: String): Unit

def deleteVertices(df: DataFrame, labels: Seq[String] = Seq.empty, cache: Boolean = true): Unit

def dropIsolatedVertices(): DseGraphFrame

var dseGraphName: Option[String]

lazy val edgeIdColumnNames: Seq[String]

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def filterEdges(conditionExpr: String): DseGraphFrame

def filterEdges(condition: Column): DseGraphFrame

def filterVertices(conditionExpr: String): DseGraphFrame

def filterVertices(condition: Column): DseGraphFrame

def finalize(): Unit

final def getClass(): Class[_]

def getEdgeLabelFromSchema(outVertexLabel: String, edgeLabel: String, inVertexLabel: String): EdgeLabel

val gf: GraphFrame

val graphKeyspace: GraphKeyspace

def graphName: String

val graphOptions: Map[String, String]

def hashCode(): Int

def idColumn(labelColumn: Column, idColumns: Column*): Column

def idColumn(label: String, idColumns: Column*): Column

def io(url: String): DseGraphTraversal[Vertex]

final def isInstanceOf[T0]: Boolean

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

def persist(storageLevel: StorageLevel): CoreDseGraphFrame.this.type

def persist(): CoreDseGraphFrame.this.type

lazy val spark: SparkSession

lazy val sqlContext: SQLContext

final def synchronized[T0](arg0: ⇒ T0): T0

def toExternalEdgeId(label: String, srcId: String, dstId: String, ids: Seq[Any], schema: StructType): AnyRef

def toExternalVertexId(id: String): AnyRef

def toString(): String

def unpersist(blocking: Boolean): CoreDseGraphFrame.this.type

def unpersist(): CoreDseGraphFrame.this.type

def updateEdges(outVertexLabel: String, edgeLabel: String, inVertexLabel: String, df: DataFrame): Unit

def updateEdges(df: DataFrame, cache: Boolean = true): Unit

def updateEdges(df: DataFrame): Unit

def updateVertices(vertexLabel: String, df: DataFrame): Unit

def updateVertices(df: DataFrame, labels: Seq[String] = Seq.empty, cache: Boolean = true): Unit

def updateVertices(df: DataFrame): Unit

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

def withCachedDf[T](df: DataFrame, cache: Boolean)(code: ⇒ T): T

Inherited from DseGraphFrame

Inherited from Serializable

Inherited from Serializable

Inherited from AnyRef

Inherited from Any

Ungrouped