Sparkでデータ処理プログラムを書くためのAPIには、RDDとDataFrameの二種類がある。2つのAPIを用いてwordcountを書いてみる。wordcountは、テキスト中の単語の出現回数を数えるプログラムであり、分散データ処理の必修課題である。 RDDは低レベルなAPIで、データのレコードにはスキーマがない。データ処理は、map関数、flatMap関数などリスト処理的な高階関数によって記述する。reduceByKeyなどいくつかの操作は、レコードが(key, value)のタプルであることを要求するが、その検査はジョブ投入時ではなく、タスク実行時に行われる。総じて、古式ゆかしいMapReduceの感覚で扱える。 DataFrameは高レベルのAPIで、データのレコードにはスキーマが適用される。データ処理は、SQLによって記述する。あるいは、ホスト言語上のDSL（以下クエリDSL


{{#tags}}- {{label}}
{{/tags}}