1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
|
json_tuple(jsonCol:Column, fields:String*) get_json_object(jsonCol:Column, path:String)
val schema: StructType = StructType(Seq( StructField("name", StringType), StructField("age", IntegerType), StructField("isMember", BooleanType), StructField("salary", FloatType) )) from_json(json:Column,schema:StructType).as(alias:String) from_json(lit("{\"name\":\"张三\",\"age\":22,\"isMember\":false,\"salary\":3566.38}"),schema).as("stu")
select($"stu.name",$"stu.age",$"stu.isMember",$"stu.salary")
val options:Map[String,String] = Map("header" -> "true", "lineSep" -> "\n") from_csv(lit("henry,22,true,3454.23"),schema,options).as("stu") select($"stu.name",$"stu.age",$"stu.isMember",$"stu.salary")
regexp_extract(col:Column, pattern:String, groupId:Int)
split(col:Column,pattern:String) substring(col:Column,pos:Int,len:Int) substring_index(col:Column,sep:String,count:Int)
locate(subStr:String,col:Column) instr(col:Column,subStr:String)
concat(cols:Column*) concat_ws(sep:String,cols:Column*)
length(col:Column)
lpad(col:Column,len:Int,pad:String) rpad(col:Column,len:Int,pad:String)
ltrim(col:Column) rtrim(col:Column) trim(col:Column)
initcap(col:Column) upper(col:Column) lower(col:Column)
hash(col:Column) regexp_replace(col:Column,pattern:String,replace:String) translate(col:Column,from:String,to:String) reverse(col:Column)
encode(col:Column, charSet:String) decode(col:Column, charSet:String)
sha1(col:Column) md5(col:Column)
|