-- Create a simple table
CREATE TABLE users (
    id BIGINT NOT NULL,
    name STRING,
    email STRING,
    created_at TIMESTAMP
);

-- Create table with complex data types
CREATE TABLE events (
    event_id BIGINT NOT NULL,
    user_id BIGINT,
    event_type STRING,
    -- Array column: each row holds a list of string tags.
    tags ARRAY<STRING>,
    -- Struct column: nested fields addressed as metadata.source, metadata.version, ...
    metadata STRUCT<source: STRING, version: INT, processed_at: TIMESTAMP>,
    occurred_at TIMESTAMP
);
# Create DataFrame
# NOTE: `spark` is not defined in this snippet; it is assumed to be an
# already-initialised SparkSession.
data = [
    (1, "Alice", "alice@example.com"),
    (2, "Bob", "bob@example.com"),
    (3, "Charlie", "charlie@example.com"),
]
df = spark.createDataFrame(data, ["id", "name", "email"])

# Write as new table using catalog
df.writeTo("users").create()
// Brings `toDF` into scope for local Seq collections.
// NOTE: `spark` is not defined in this snippet; it is assumed to be an
// already-initialised SparkSession.
import spark.implicits._

// Create DataFrame
// Long literals keep `id` a 64-bit column, consistent with the BIGINT `id`
// in the SQL example and the LongType `id` in the Java example.
val data = Seq(
  (1L, "Alice", "alice@example.com"),
  (2L, "Bob", "bob@example.com"),
  (3L, "Charlie", "charlie@example.com")
)
val df = data.toDF("id", "name", "email")

// Write as new table using catalog
df.writeTo("users").create()
importorg.apache.spark.sql.types.*;importorg.apache.spark.sql.Row;importorg.apache.spark.sql.RowFactory;// Create DataFrameList<Row>data=Arrays.asList(RowFactory.create(1L,"Alice","alice@example.com"),RowFactory.create(2L,"Bob","bob@example.com"),RowFactory.create(3L,"Charlie","charlie@example.com"));StructTypeschema=newStructType(newStructField[]{newStructField("id",DataTypes.LongType,false,Metadata.empty()),newStructField("name",DataTypes.StringType,true,Metadata.empty()),newStructField("email",DataTypes.StringType,true,Metadata.empty())});Dataset<Row>df=spark.createDataFrame(data,schema);// Write as new table using catalogdf.writeTo("users").create();
# Create new data
# NOTE: `spark` is not defined in this snippet; it is assumed to be an
# already-initialised SparkSession.
new_data = [
    (8, "Henry", "henry@example.com"),
    (9, "Ivy", "ivy@example.com"),
]
new_df = spark.createDataFrame(new_data, ["id", "name", "email"])

# Append to existing table
new_df.writeTo("users").append()

# Alternative: use traditional write API with mode
# Use one form or the other: both calls append `new_df` to "users", so
# running both inserts the rows twice.
new_df.write.mode("append").saveAsTable("users")
// Create new data
// NOTE: `toDF` requires `import spark.implicits._` to be in scope; `spark`
// is assumed to be an already-initialised SparkSession.
// Long literals keep `id` a 64-bit column, consistent with the BIGINT `id`
// in the SQL example and the LongType `id` in the Java example.
val newData = Seq(
  (8L, "Henry", "henry@example.com"),
  (9L, "Ivy", "ivy@example.com")
)
val newDF = newData.toDF("id", "name", "email")

// Append to existing table
newDF.writeTo("users").append()

// Alternative: use traditional write API with mode
// Use one form or the other: both calls append `newDF` to "users", so
// running both inserts the rows twice.
newDF.write.mode("append").saveAsTable("users")
// Create new dataList<Row>newData=Arrays.asList(RowFactory.create(8L,"Henry","henry@example.com"),RowFactory.create(9L,"Ivy","ivy@example.com"));Dataset<Row>newDF=spark.createDataFrame(newData,schema);// Append to existing tablenewDF.writeTo("users").append();// Alternative: use traditional write API with modenewDF.write().mode("append").saveAsTable("users");