3
Collecting dbldatagen
Using cached dbldatagen-0.4.0.post1-py3-none-any.whl.metadata (9.9 kB)
Using cached dbldatagen-0.4.0.post1-py3-none-any.whl (122 kB)
Installing collected packages: dbldatagen
Successfully installed dbldatagen-0.4.0.post1
[notice] A new release of pip is available: 24.0 -> 25.0.1
[notice] To update, run: pip install --upgrade pip
4
synthetic_data_1739557219
8
Warning: classes defined within packages cannot be redefined without a cluster restart.
Compilation successful.
10
import org.apache.spark.sql.execution.streaming.state.RocksDBStateStoreProvider
import java.util.UUID
import org.apache.spark.sql.streaming.StatefulProcessor
import org.apache.spark.sql.streaming._
import java.sql.Timestamp
import org.apache.spark.sql.Encoders
import org.apache.spark.sql.streaming.MS._
12
defined class SCDType2StatefulProcessor
14
inputStream: org.apache.spark.sql.Dataset[org.apache.spark.sql.streaming.MS.UserLocation] = [user: string, time: timestamp ... 1 more field]
16
baseLocation: String = /Workspace/Users/bo.gao@databricks.com/tws/fd8d30f8-d135-4349-927d-ea6b4b56f843
checkpointLocation: String = /Workspace/Users/bo.gao@databricks.com/tws/fd8d30f8-d135-4349-927d-ea6b4b56f843/checkpoint
outputTable: String = /Workspace/Users/bo.gao@databricks.com/tws/fd8d30f8-d135-4349-927d-ea6b4b56f843/output
18
19
res17: Boolean = true