15
15
[org.apache.spark.sql.types StructType StructField
16
16
DataTypes DataType]
17
17
[tech.v3.datatype ObjectReader]
18
- [tech.v3.dataset SimpleRDD]
19
18
[java.time LocalDate Instant]
20
19
[java.util List]))
21
20
167
166
(ds->spark-dataset ds session nil )))
168
167
169
168
170
- (defn default-ds-fn
171
- [src]
172
- (-> (ds-io/->dataset src)
173
- (prepare-ds-for-spark )
174
- (dataset->row-list )))
175
169
176
170
177
- (defn ds-src-data->rdd
178
- " Given a session, a full namespaced name that resolves to an IFn,
179
- and a list of serializable data produce an RDD."
180
- (^Dataset [^SparkSession spark-session
181
- ^String ds-fn-name
182
- ds-src-data]
183
- (SimpleRDD. (.sparkContext spark-session)
184
- (vec ds-src-data)
185
- ds-fn-name)))
186
-
187
-
188
- (comment
189
- (require '[zero-one.geni.core :as g])
190
- (require '[zero-one.geni.defaults :as geni-defaults])
191
- (def dataframe (g/read-csv! " test/data/stocks.csv" ))
192
- (require '[tech.v3.dataset :as ds])
193
- (def stocks (ds/->dataset " test/data/stocks.csv" ))
194
- (def session @geni-defaults /spark )
195
- (def schema (-> (ds/->dataset " test/data/stocks.csv" )
196
- (prepare-ds-for-spark )
197
- (ds-schema )))
198
- (def rdd (ds-src-data->dataset @geni-defaults/spark
199
- schema
200
- " tech.v3.libs.spark/default-ds-fn"
201
- [[{:a 1 } {:a 2 }]]))
202
- )
203
-
204
171
205
172
(defn collect-spark-dataset->ds
206
173
[^Dataset dataset]
227
194
nil
228
195
[]))))
229
196
(ds-impl/new-dataset ))))
197
+
198
+
199
+
200
+ (comment
201
+ ; ; databricks-connect specific classes
202
+ ; ; should work similarly for spark-connect
203
+
204
+ ; ;Tested with these deps
205
+ ; ;org.scala-lang/scala-reflect {:mvn/version "2.12.18"}
206
+ ; ;com.databricks/databricks-connect {:mvn/version "16.1.0"}
207
+
208
+
209
+ (import
210
+ '[com.databricks.connect DatabricksSession]
211
+ '[com.databricks.sdk.core DatabricksConfig])
212
+
213
+ (def config (.. (DatabricksConfig. ) (setProfile " adb-xxxxx" )))
214
+ (def spark (.. (DatabricksSession/builder ) (sdkConfig config) getOrCreate))
215
+
216
+ (->
217
+ (.sql spark " show catalogs;" )
218
+ collect-spark-dataset->ds)
219
+
220
+ )
0 commit comments