[cevent@hadoop207 hadoop-2.7.2]$ cd /opt/module/datas/
[cevent@hadoop207 datas]$ ll
total 383028
-rw-rw-r--. 1 cevent cevent       147 May 10 13:46 510test.txt
-rw-rw-r--. 1 cevent cevent 120734753 Jun  8 13:31 bigtable
-rw-rw-r--. 1 cevent cevent       266 May 17 13:52 business.txt
-rw-rw-r--. 1 cevent cevent       129 May 17 13:52 constellation.txt
-rw-rw-r--. 1 cevent cevent        71 May 17 13:52 dept.txt
-rw-rw-r--. 1 cevent cevent        78 May 17 13:52 emp_sex.txt
drwxrwxr-x. 3 cevent cevent      4096 Jun  5 14:17 emp.txt
drwxrwxr-x. 4 cevent cevent      4096 May 22 13:32 export
-rw-rw-r--. 1 cevent cevent      2794 Jun  4 22:32 hadoop_hive_userdefinedfunc_plugin-1.0-SNAPSHOT.jar
-rw-rw-r--. 1 cevent cevent        37 May 17 13:52 location.txt
-rw-rw-r--. 1 cevent cevent  19014993 May 17 13:52 log.data
-rw-rw-r--. 1 cevent cevent       136 May 17 13:52 movie.txt
-rw-rw-r--. 1 cevent cevent 118645854 Jun  9 13:20 nullid
-rw-rw-r--. 1 cevent cevent 121734744 Jun  9 13:16 ori
-rw-rw-r--. 1 cevent cevent       213 May 17 13:52 score.txt
-rw-rw-r--. 1 cevent cevent  12018355 Jun  8 13:31 smalltable
drwxrwxr-x. 3 cevent cevent      4096 Jun  5 14:18 snappy-distribute-result
-rw-rw-r--. 1 cevent cevent       165 May 17 13:52 student.txt
-rw-rw-r--. 1 cevent cevent       301 May 17 13:52 数据说明.txt
[cevent@hadoop207 datas]$ mkdir user/
[cevent@hadoop207 datas]$ mkdir video/
[cevent@hadoop207 datas]$ ll
total 383036
-rw-rw-r--. 1 cevent cevent       147 May 10 13:46 510test.txt
-rw-rw-r--. 1 cevent cevent 120734753 Jun  8 13:31 bigtable
-rw-rw-r--. 1 cevent cevent       266 May 17 13:52 business.txt
-rw-rw-r--. 1 cevent cevent       129 May 17 13:52 constellation.txt
-rw-rw-r--. 1 cevent cevent        71 May 17 13:52 dept.txt
-rw-rw-r--. 1 cevent cevent        78 May 17 13:52 emp_sex.txt
drwxrwxr-x. 3 cevent cevent      4096 Jun  5 14:17 emp.txt
drwxrwxr-x. 4 cevent cevent      4096 May 22 13:32 export
-rw-rw-r--. 1 cevent cevent      2794 Jun  4 22:32 hadoop_hive_userdefinedfunc_plugin-1.0-SNAPSHOT.jar
-rw-rw-r--. 1 cevent cevent        37 May 17 13:52 location.txt
-rw-rw-r--. 1 cevent cevent  19014993 May 17 13:52 log.data
-rw-rw-r--. 1 cevent cevent       136 May 17 13:52 movie.txt
-rw-rw-r--. 1 cevent cevent 118645854 Jun  9 13:20 nullid
-rw-rw-r--. 1 cevent cevent 121734744 Jun  9 13:16 ori
-rw-rw-r--. 1 cevent cevent       213 May 17 13:52 score.txt
-rw-rw-r--. 1 cevent cevent  12018355 Jun  8 13:31 smalltable
drwxrwxr-x. 3 cevent cevent      4096 Jun  5 14:18 snappy-distribute-result
-rw-rw-r--. 1 cevent cevent       165 May 17 13:52 student.txt
drwxrwxr-x. 2 cevent cevent      4096 Jun  9 21:23 user
drwxrwxr-x. 2 cevent cevent      4096 Jun  9 21:23 video
-rw-rw-r--. 1 cevent cevent       301 May 17 13:52 数据说明.txt
[cevent@hadoop207 datas]$ hadoop fs -mkdir /cevent_video_show
[cevent@hadoop207 datas]$ hadoop fs -put user/ /cevent_video_show
[cevent@hadoop207 datas]$ hadoop fs -put video/ /cevent_video_show
Link: http://hadoop207.cevent.com:50070/explorer.html#/cevent_video_show/user
# Root logger: log level INFO; all output goes to the stdout appender
log4j.rootLogger=INFO, stdout

# stdout: ConsoleAppender with a PatternLayout and its ConversionPattern
log4j.appender.stdout=org.apache.log4j.ConsoleAppender
log4j.appender.stdout.layout=org.apache.log4j.PatternLayout
log4j.appender.stdout.layout.ConversionPattern=%d %p [%c] - %m%n

# logfile: FileAppender writing to target/spring.log
# (defined here but not attached to the root logger above)
log4j.appender.logfile=org.apache.log4j.FileAppender
log4j.appender.logfile.File=target/spring.log
log4j.appender.logfile.layout=org.apache.log4j.PatternLayout
log4j.appender.logfile.layout.ConversionPattern=%d %p [%c] - %m%n
package com.cevent.hadoop.hive.etl;
/**
 * Created by Cevent on 2020/6/9.
 */
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Counter;
import org.apache.hadoop.mapreduce.Mapper;

import java.io.IOException;

/**
 * @author cevent
 * @description Mapper<input key, input value, output key, output value>
 * @date 2020/6/9 22:27
 */
public class ETLMapper extends Mapper<LongWritable, Text, Text, NullWritable> {
    // Single-threaded buffer reused to rebuild each record
    private StringBuilder stringBuilder = new StringBuilder();
    private Text text = new Text();
    // Counters recording how many records are seen and how many pass the filter
    private Counter totalData;
    private Counter passData;

    @Override
    protected void setup(Context context) throws IOException, InterruptedException {
        // getCounter(groupName, counterName)
        totalData = context.getCounter("ETL", "TotalData");
        passData = context.getCounter("ETL", "PassData");
    }

    @Override
    protected void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException {
        // 1. Split the record on tabs
        String[] split = value.toString().split("\t");
        // Count every input record
        totalData.increment(1);
        // 2. Filter by length: records with fewer than 9 fields are dropped
        if (split.length >= 9) {
            // Strip spaces from the category field, e.g. "People & Blogs"
            split[3] = split[3].replace(" ", "");
            // 3. Rebuild the record with new separators; clear the buffer before appending
            stringBuilder.setLength(0);
            // Sample record (tab-separated):
            //   LKh7zAJ4nwo  TheReceptionist  653  Entertainment  424  13021  4.34  1305  744
            // followed by the related video ids from field 10 onward:
            //   DjdA-5oKYFQ  NxTDlnOuybo  c-8VuICzXtU  DH56yrIO5nI  ...
            // The first 9 fields stay tab-separated, the related ids are joined with '&',
            // and the last field gets no trailing separator.
            for (int i = 0; i < split.length; i++) {
                if (i == split.length - 1) {
                    // 4. Last field: append without a separator
                    stringBuilder.append(split[i]);
                } else if (i < 9) {
                    // First 9 fields: tab-separated
                    stringBuilder.append(split[i]).append('\t');
                } else {
                    // Field 10 onward: '&'-separated related ids
                    stringBuilder.append(split[i]).append('&');
                }
            }
            // 5. Emit the rebuilt record
            text.set(stringBuilder.toString());
            // 6. Count the record as passed
            passData.increment(1);
            context.write(text, NullWritable.get());
        }
    }
}
package com.cevent.hadoop.hive.etl;
/**
 * Created by Cevent on 2020/6/9.
 */
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;

/**
 * @author cevent
 * @description Map-only ETL driver: zero reducers; input and output paths come from args
 * @date 2020/6/9 22:26
 */
public class ETLDriver {
    public static void main(String[] args) throws Exception {
        Job job = Job.getInstance(new Configuration());
        job.setJarByClass(ETLDriver.class);
        job.setMapperClass(ETLMapper.class);
        job.setNumReduceTasks(0);
        job.setMapOutputKeyClass(Text.class);
        job.setMapOutputValueClass(NullWritable.class);
        FileInputFormat.setInputPaths(job, new Path(args[0]));
        FileOutputFormat.setOutputPath(job, new Path(args[1]));
        boolean flag = job.waitForCompletion(true);
        System.exit(flag ? 0 : 1);
    }
}
[cevent@hadoop207 hadoop-2.7.2]$ sbin/start-dfs.sh
Starting namenodes on [hadoop207.cevent.com]
hadoop207.cevent.com: starting namenode, logging to /opt/module/hadoop-2.7.2/logs/hadoop-cevent-namenode-hadoop207.cevent.com.out
hadoop207.cevent.com: starting datanode, logging to /opt/module/hadoop-2.7.2/logs/hadoop-cevent-datanode-hadoop207.cevent.com.out
Starting secondary namenodes [hadoop207.cevent.com]
hadoop207.cevent.com: starting secondarynamenode, logging to /opt/module/hadoop-2.7.2/logs/hadoop-cevent-secondarynamenode-hadoop207.cevent.com.out
[cevent@hadoop207 hadoop-2.7.2]$ sbin/start-yarn.sh
starting yarn daemons
starting resourcemanager, logging to /opt/module/hadoop-2.7.2/logs/yarn-cevent-resourcemanager-hadoop207.cevent.com.out
hadoop207.cevent.com: starting nodemanager, logging to /opt/module/hadoop-2.7.2/logs/yarn-cevent-nodemanager-hadoop207.cevent.com.out
[cevent@hadoop207 hadoop-2.7.2]$ jps
4494 Jps
4163 SecondaryNameNode
4450 NodeManager
3845 NameNode
3958 DataNode
4336 ResourceManager
[cevent@hadoop207 hadoop-2.7.2]$ cd /opt/module/datas/
[cevent@hadoop207 datas]$ ll
total 383044
-rw-rw-r--. 1 cevent cevent       147 May 10 13:46 510test.txt
-rw-rw-r--. 1 cevent cevent 120734753 Jun  8 13:31 bigtable
-rw-rw-r--. 1 cevent cevent       266 May 17 13:52 business.txt
-rw-rw-r--. 1 cevent cevent       129 May 17 13:52 constellation.txt
-rw-rw-r--. 1 cevent cevent        71 May 17 13:52 dept.txt
-rw-rw-r--. 1 cevent cevent        78 May 17 13:52 emp_sex.txt
drwxrwxr-x. 3 cevent cevent      4096 Jun  5 14:17 emp.txt
drwxrwxr-x. 4 cevent cevent      4096 May 22 13:32 export
-rw-rw-r--. 1 cevent cevent      2794 Jun  4 22:32 hadoop_hive_userdefinedfunc_plugin-1.0-SNAPSHOT.jar
-rw-rw-r--. 1 cevent cevent        37 May 17 13:52 location.txt
-rw-rw-r--. 1 cevent cevent  19014993 May 17 13:52 log.data
-rw-rw-r--. 1 cevent cevent       136 May 17 13:52 movie.txt
-rw-rw-r--. 1 cevent cevent 118645854 Jun  9 13:20 nullid
-rw-rw-r--. 1 cevent cevent 121734744 Jun  9 13:16 ori
-rw-rw-r--. 1 cevent cevent       213 May 17 13:52 score.txt
-rw-rw-r--. 1 cevent cevent  12018355 Jun  8 13:31 smalltable
drwxrwxr-x. 3 cevent cevent      4096 Jun  5 14:18 snappy-distribute-result
-rw-rw-r--. 1 cevent cevent       165 May 17 13:52 student.txt
drwxrwxr-x. 2 cevent cevent      4096 Jun  9 21:27 user
drwxrwxr-x. 2 cevent cevent      4096 Jun  9 21:27 video
-rw-rw-r--. 1 cevent cevent      4874 Jun 10 13:51 video_etl200609-1.0-SNAPSHOT.jar
-rw-rw-r--. 1 cevent cevent       301 May 17 13:52 数据说明.txt
[cevent@hadoop207 datas]$ mv video_etl200609-1.0-SNAPSHOT.jar video_etl200609-1.0.jar
Execute the jar:
[cevent@hadoop207 datas]$ hadoop jar video_etl200609-1.0.jar com.cevent.hadoop.hive.etl.ETLDriver /cevent_video_show/video /cevent_video_show/video_etl
20/06/10 13:56:07 INFO client.RMProxy: Connecting to ResourceManager at hadoop207.cevent.com/192.168.1.207:8032
20/06/10 13:56:07 WARN mapreduce.JobResourceUploader: Hadoop command-line option parsing not performed. Implement the Tool interface and execute your application with ToolRunner to remedy this.
20/06/10 13:56:09 INFO input.FileInputFormat: Total input paths to process : 5
20/06/10 13:56:09 INFO mapreduce.JobSubmitter: number of splits:5
20/06/10 13:56:09 INFO mapreduce.JobSubmitter: Submitting tokens for job: job_1591768379763_0001
20/06/10 13:56:10 INFO impl.YarnClientImpl: Submitted application application_1591768379763_0001
20/06/10 13:56:10 INFO mapreduce.Job: The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0001/
20/06/10 13:56:10 INFO mapreduce.Job: Running job: job_1591768379763_0001
20/06/10 13:56:26 INFO mapreduce.Job: Job job_1591768379763_0001 running in uber mode : false
20/06/10 13:56:26 INFO mapreduce.Job:  map 0% reduce 0%
20/06/10 13:56:58 INFO mapreduce.Job:  map 54% reduce 0%
20/06/10 13:57:01 INFO mapreduce.Job:  map 63% reduce 0%
20/06/10 13:57:05 INFO mapreduce.Job:  map 66% reduce 0%
20/06/10 13:57:09 INFO mapreduce.Job:  map 75% reduce 0%
20/06/10 13:57:13 INFO mapreduce.Job:  map 90% reduce 0%
20/06/10 13:57:15 INFO mapreduce.Job:  map 97% reduce 0%
20/06/10 13:57:18 INFO mapreduce.Job:  map 100% reduce 0%
20/06/10 13:57:23 INFO mapreduce.Job: Job job_1591768379763_0001 completed successfully
20/06/10 13:57:26 INFO mapreduce.Job: Counters: 32
    File System Counters
        FILE: Number of bytes read=0
        FILE: Number of bytes written=584515
        FILE: Number of read operations=0
        FILE: Number of large read operations=0
        FILE: Number of write operations=0
        HDFS: Number of bytes read=213621152
        HDFS: Number of bytes written=212238254
        HDFS: Number of read operations=25
        HDFS: Number of large read operations=0
        HDFS: Number of write operations=10
    Job Counters
        Launched map tasks=5
        Data-local map tasks=5
        Total time spent by all maps in occupied slots (ms)=255598
        Total time spent by all reduces in occupied slots (ms)=0
        Total time spent by all map tasks (ms)=255598
        Total vcore-milliseconds taken by all map tasks=255598
        Total megabyte-milliseconds taken by all map tasks=261732352
    Map-Reduce Framework
        Map input records=749361
        Map output records=743569
        Input split bytes=635
        Spilled Records=0
        Failed Shuffles=0
        Merged Map outputs=0
        GC time elapsed (ms)=5302
        CPU time spent (ms)=21270
        Physical memory (bytes) snapshot=661708800
        Virtual memory (bytes) snapshot=4414775296
        Total committed heap usage (bytes)=310902784
    ETL
        PassData=743569    (TotalData - PassData: about 6,000 malformed records were filtered out)
        TotalData=749361
    File Input Format Counters
        Bytes Read=213620517
    File Output Format Counters
        Bytes Written=212238254
Link: http://hadoop207.cevent.com:50070/explorer.html#/cevent_video_show/video_etl
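The cleaned records now sit under /cevent_video_show/video_etl. Note that the video_info external table created in the Hive session below points at the raw /cevent_video_show/video directory; if the ETL output should be queried instead, an external table can be pointed at the result directory. A minimal sketch, assuming the same column layout as the video_info DDL used later (the table name video_info_etl is illustrative, not from the session):

-- hypothetical external table over the ETL output directory
create external table video_info_etl(
video_id string,
uploader string,
age int,
category array<string>,
length int,
views int,
rate float,
ratings int,
comments int,
related_id array<string>
)
row format delimited fields terminated by '\t'
collection items terminated by '&'
location '/cevent_video_show/video_etl';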
[cevent@hadoop207 hive-1.2.1]$ bin/beeline
Beeline version 1.2.1 by Apache Hive
0: jdbc:hive2://hadoop.cevent.com:10000 (closed)> !connect jdbc:hive2://hadoop207.cevent.com:10000
Connecting to jdbc:hive2://hadoop207.cevent.com:10000
Enter username for jdbc:hive2://hadoop207.cevent.com:10000: cevent
Enter password for jdbc:hive2://hadoop207.cevent.com:10000: ******
Connected to: Apache Hive (version 1.2.1)
Driver: Hive JDBC (version 1.2.1)
Transaction isolation: TRANSACTION_REPEATABLE_READ
1: jdbc:hive2://hadoop207.cevent.com:10000> use cevent01;
No rows affected (1.423 seconds)
1: jdbc:hive2://hadoop207.cevent.com:10000> show tables;
+------------------------+--+
| tab_name |
+------------------------+--+
| big_join |
| c_dept |
| c_emp |
| emp_gender |
| join_dep_partition |
| join_original |
| join_original_null_id |
| join_original_table |
| join_table |
| locations |
| person_info |
| small_join |
| student |
| student_bucket |
+------------------------+--+
14 rows selected (0.621 seconds)

Create the external user table and load the data:
1: jdbc:hive2://hadoop207.cevent.com:10000> create external table video_user_info(
1: jdbc:hive2://hadoop207.cevent.com:10000> uploader string,
1: jdbc:hive2://hadoop207.cevent.com:10000> videos int,
1: jdbc:hive2://hadoop207.cevent.com:10000> friends int
1: jdbc:hive2://hadoop207.cevent.com:10000> )
1: jdbc:hive2://hadoop207.cevent.com:10000> row format delimited fields terminated by '\t'
1: jdbc:hive2://hadoop207.cevent.com:10000> location '/cevent_video_show/user';
No rows affected (0.141 seconds)
1: jdbc:hive2://hadoop207.cevent.com:10000> select * from video_user_info limit 5;
+---------------------------+-------------------------+--------------------------+--+
| video_user_info.uploader  | video_user_info.videos  | video_user_info.friends  |
+---------------------------+-------------------------+--------------------------+--+
| barelypolitical           | 151                     | 5106                     |
| bonk65                    | 89                      | 144                      |
| camelcars                 | 26                      | 674                      |
| cubskickass34             | 13                      | 126                      |
| boydism08                 | 32                      | 50                       |
+---------------------------+-------------------------+--------------------------+--+
5 rows selected (0.389 seconds)

Create the external video table and load the data:
1: jdbc:hive2://hadoop207.cevent.com:10000> create external table video_info(
1: jdbc:hive2://hadoop207.cevent.com:10000> video_id string,
1: jdbc:hive2://hadoop207.cevent.com:10000> uploader string,
1: jdbc:hive2://hadoop207.cevent.com:10000> age int,
1: jdbc:hive2://hadoop207.cevent.com:10000> category array<string>,
1: jdbc:hive2://hadoop207.cevent.com:10000> length int,
1: jdbc:hive2://hadoop207.cevent.com:10000> views int,
1: jdbc:hive2://hadoop207.cevent.com:10000> rate float,
1: jdbc:hive2://hadoop207.cevent.com:10000> ratings int,
1: jdbc:hive2://hadoop207.cevent.com:10000> comments int,
1: jdbc:hive2://hadoop207.cevent.com:10000> related_id array<string>
1: jdbc:hive2://hadoop207.cevent.com:10000> )
1: jdbc:hive2://hadoop207.cevent.com:10000> row format delimited fields terminated by '\t'
1: jdbc:hive2://hadoop207.cevent.com:10000> collection items terminated by '&'
1: jdbc:hive2://hadoop207.cevent.com:10000> location '/cevent_video_show/video';
No rows affected (0.22 seconds)
1: jdbc:hive2://hadoop207.cevent.com:10000> select * from video_info limit 5;
+----------------------+----------------------+-----------------+----------------------+--------------------+-------------------+--------------------+---------------------+----------------------+------------------------+--+
| video_info.video_id | video_info.uploader | video_info.age | video_info.category | video_info.length | video_info.views | video_info.rate | video_info.ratings | video_info.comments | video_info.related_id |
+----------------------+----------------------+-----------------+----------------------+--------------------+-------------------+--------------------+---------------------+----------------------+------------------------+--+
| LKh7zAJ4nwo | TheReceptionist | 653 | ["Entertainment"] | 424 | 13021 | 4.340000152587891 | 1305 | 744 | ["DjdA-5oKYFQ"] |
| 7D0Mf4Kn4Xk | periurban | 583 | ["Music"] | 201 | 6508 | 4.190000057220459 | 687 | 312 | ["e2k0h6tPvGc"] |
| n1cEq1C8oqQ | Pipistrello | 525 | ["Comedy"] | 125 | 1687 | 4.010000228881836 | 363 | 141 | ["eprHhmurMHg"] |
| OHkEzL4Unck | ichannel | 638 | ["Comedy"] | 299 | 8043 | 4.400000095367432 | 518 | 371 | ["eyUSTmEUQRg"] |
| -boOvAGNKUc | mrpitifulband | 639 | ["Music"] | 287 | 7548 | 4.480000019073486 | 606 | 386 | ["fmUwUURgsX0"] |
+----------------------+----------------------+-----------------+----------------------+--------------------+-------------------+--------------------+---------------------+----------------------+------------------------+--+
5 rows selected (0.202 seconds)

Create managed tables (stored in the Hive warehouse on HDFS) and load the data:
1: jdbc:hive2://hadoop207.cevent.com:10000> create table video_user stored as orc as select * from video_user_info;
INFO : Number of reduce tasks is set to 0 since there's no reduce operator
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591768379763_0002
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0002/
INFO : Starting Job = job_1591768379763_0002, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0002/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591768379763_0002
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 0
INFO : 2020-06-10 16:47:42,449 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 16:48:01,857 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 6.59 sec
INFO : MapReduce Total cumulative CPU time: 6 seconds 590 msec
INFO : Ended Job = job_1591768379763_0002
INFO : Stage-4 is selected by condition resolver.
INFO : Stage-3 is filtered out by condition resolver.
INFO : Stage-5 is filtered out by condition resolver.
INFO : Moving data to: hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_16-47-23_881_9118723475356633122-1/-ext-10001 from hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_16-47-23_881_9118723475356633122-1/-ext-10003
INFO : Moving data to: hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/video_user from hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_16-47-23_881_9118723475356633122-1/-ext-10001
INFO : Table cevent01.video_user stats: [numFiles=1, numRows=2139109, totalSize=18167783, rawDataSize=218189118]
No rows affected (41.039 seconds)

Create the managed video table and load the data:
1: jdbc:hive2://hadoop207.cevent.com:10000> create table video_store stored as orc as select * from video_info;
INFO : Number of reduce tasks is set to 0 since there's no reduce operator
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591768379763_0003
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0003/
INFO : Starting Job = job_1591768379763_0003, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0003/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591768379763_0003
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 0
INFO : 2020-06-10 16:49:01,082 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 16:49:13,566 Stage-1 map = 31%, reduce = 0%, Cumulative CPU 6.74 sec
INFO : 2020-06-10 16:49:18,810 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 10.78 sec
INFO : MapReduce Total cumulative CPU time: 10 seconds 780 msec
INFO : Ended Job = job_1591768379763_0003
INFO : Stage-4 is selected by condition resolver.
INFO : Stage-3 is filtered out by condition resolver.
INFO : Stage-5 is filtered out by condition resolver.
INFO : Moving data to: hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_16-48-50_581_7964744140492116393-1/-ext-10001 from hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_16-48-50_581_7964744140492116393-1/-ext-10003
INFO : Moving data to: hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/video_store from hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_16-48-50_581_7964744140492116393-1/-ext-10001
INFO : Table cevent01.video_store stats: [numFiles=1, numRows=749361, totalSize=22098531, rawDataSize=321015240]
No rows affected (34.551 seconds)

Run the query: top 10 videos by view count:
1: jdbc:hive2://hadoop207.cevent.com:10000> select * from video_info order by views desc limit 10;
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591768379763_0004
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0004/
INFO : Starting Job = job_1591768379763_0004, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0004/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591768379763_0004
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 17:13:56,985 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 17:14:14,708 Stage-1 map = 21%, reduce = 0%, Cumulative CPU 5.43 sec
INFO : 2020-06-10 17:14:17,853 Stage-1 map = 67%, reduce = 0%, Cumulative CPU 7.68 sec
INFO : 2020-06-10 17:14:20,757 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 9.3 sec
INFO : 2020-06-10 17:14:38,675 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 12.55 sec
INFO : MapReduce Total cumulative CPU time: 12 seconds 550 msec
INFO : Ended Job = job_1591768379763_0004
+----------------------+----------------------+-----------------+-----------------------+--------------------+-------------------+---------------------+---------------------+----------------------+------------------------+--+
| video_info.video_id | video_info.uploader | video_info.age | video_info.category | video_info.length | video_info.views | video_info.rate | video_info.ratings | video_info.comments | video_info.related_id |
+----------------------+----------------------+-----------------+-----------------------+--------------------+-------------------+---------------------+---------------------+----------------------+------------------------+--+
| dMH0bHeiRNg | judsonlaipply | 415 | ["Comedy"] | 360 | 42513417 | 4.679999828338623 | 87520 | 22718 | ["OxBtqwlTMJQ"] |
| 0XxI-hvPRRA | smosh | 286 | ["Comedy"] | 194 | 20282464 | 4.489999771118164 | 80710 | 35408 | ["ut5fFyTkKv4"] |
| 1dmVU08zVpA | NBC | 670 | ["Entertainment"] | 165 | 16087899 | 4.789999961853027 | 30085 | 5945 | ["x0dzQeq6o5Q"] |
| RB-wUgnyGv0 | ChrisInScotland | 506 | ["Entertainment"] | 159 | 15712924 | 4.78000020980835 | 8222 | 1996 | ["RB-wUgnyGv0"] |
| QjA5faZF1A8 | guitar90 | 308 | ["Music"] | 320 | 15256922 | 4.840000152587891 | 120506 | 38393 | ["O9mEKMz2Pvo"] |
| -_CSo1gOd48 | tasha | 190 | ["People ","Blogs"] | 205 | 13199833 | 3.7100000381469727 | 38045 | 9904 | ["GkVBObv8TQk"] |
| 49IDp76kjPw | TexMachina | 381 | ["Comedy"] | 59 | 11970018 | 4.550000190734863 | 22579 | 5280 | ["brh6KRvQHBc"] |
| tYnn51C3X_w | CowSayingMoo | 516 | ["Music"] | 231 | 11823701 | 4.670000076293945 | 29479 | 10367 | ["zvzPK1_UkRs"] |
| pv5zWaTEVkI | OkGo | 531 | ["Music"] | 184 | 11672017 | 4.829999923706055 | 42386 | 10082 | ["W4WdLT6_Hz0"] |
| D2kJZOfq7zk | mrWoot | 199 | ["People ","Blogs"] | 185 | 11184051 | 4.820000171661377 | 42162 | 10819 | ["wQ7h-UUT2Rs"] |
+----------------------+----------------------+-----------------+-----------------------+--------------------+-------------------+---------------------+---------------------+----------------------+------------------------+--+
10 rows selected (58.238 seconds)

Query the top 10 video categories by heat (view count):
1: jdbc:hive2://hadoop207.cevent.com:10000> select categories,sum(views) hot_view
1: jdbc:hive2://hadoop207.cevent.com:10000> from
1: jdbc:hive2://hadoop207.cevent.com:10000> (
1: jdbc:hive2://hadoop207.cevent.com:10000> select video_id,views,categories
1: jdbc:hive2://hadoop207.cevent.com:10000> from video_info
1: jdbc:hive2://hadoop207.cevent.com:10000> lateral view explode(category) vtb1 as categories
1: jdbc:hive2://hadoop207.cevent.com:10000> )vtb2
1: jdbc:hive2://hadoop207.cevent.com:10000> group by categories
1: jdbc:hive2://hadoop207.cevent.com:10000> order by hot_view desc
1: jdbc:hive2://hadoop207.cevent.com:10000> limit 10;
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591768379763_0005
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0005/
INFO : Starting Job = job_1591768379763_0005, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0005/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591768379763_0005
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 17:34:05,334 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 17:34:20,032 Stage-1 map = 21%, reduce = 0%, Cumulative CPU 3.26 sec
INFO : 2020-06-10 17:34:23,171 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 4.18 sec
INFO : 2020-06-10 17:34:37,709 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 6.23 sec
INFO : MapReduce Total cumulative CPU time: 6 seconds 230 msec
INFO : Ended Job = job_1591768379763_0005
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591768379763_0006
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0006/
INFO : Starting Job = job_1591768379763_0006, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591768379763_0006/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591768379763_0006
INFO : Hadoop job information for Stage-2: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 17:34:54,889 Stage-2 map = 0%, reduce = 0%
INFO : 2020-06-10 17:35:04,185 Stage-2 map = 100%, reduce = 0%, Cumulative CPU 1.36 sec
INFO : 2020-06-10 17:35:13,581 Stage-2 map = 100%, reduce = 100%, Cumulative CPU 3.13 sec
INFO : MapReduce Total cumulative CPU time: 3 seconds 130 msec
INFO : Ended Job = job_1591768379763_0006
+----------------+-------------+--+
|   categories   |  hot_view   |
+----------------+-------------+--+
| Music          | 2426199511  |
| Entertainment  | 1644510629  |
| Comedy         | 1603337065  |
| Film           | 659449540   |
| Animation      | 659449540   |
| Sports         | 647412772   |
| Games          | 505658305   |
| Gadgets        | 505658305   |
| People         | 425607955   |
| Blogs          | 425607955   |
+----------------+-------------+--+
10 rows selected (86.081 seconds)

(Film/Animation, Games/Gadgets and People/Blogs show identical totals because compound raw category names such as "Film & Animation" are split on '&' into two array entries.)
0: jdbc:hive2://hadoop207.cevent.com:10000> select categories,count(1) count_views
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select video_id,categories
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select video_id,category,views from video_store order by views desc limit 20)
0: jdbc:hive2://hadoop207.cevent.com:10000> top1
0: jdbc:hive2://hadoop207.cevent.com:10000> lateral view explode(category) topclass as categories)
0: jdbc:hive2://hadoop207.cevent.com:10000> top2
0: jdbc:hive2://hadoop207.cevent.com:10000> group by categories;
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0001
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0001/
INFO : Starting Job = job_1591796204991_0001, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0001/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0001
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 21:50:11,943 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 21:50:27,751 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 5.16 sec
INFO : 2020-06-10 21:50:39,744 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 8.64 sec
INFO : MapReduce Total cumulative CPU time: 8 seconds 640 msec
INFO : Ended Job = job_1591796204991_0001
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0002
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0002/
INFO : Starting Job = job_1591796204991_0002, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0002/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0002
INFO : Hadoop job information for Stage-2: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 21:50:53,760 Stage-2 map = 0%, reduce = 0%
INFO : 2020-06-10 21:51:02,050 Stage-2 map = 100%, reduce = 0%, Cumulative CPU 1.26 sec
INFO : 2020-06-10 21:51:10,767 Stage-2 map = 100%, reduce = 100%, Cumulative CPU 3.1 sec
INFO : MapReduce Total cumulative CPU time: 3 seconds 100 msec
INFO : Ended Job = job_1591796204991_0002
+----------------+--------------+--+
|   categories   | count_views  |
+----------------+--------------+--+
| Blogs          | 2            |
| UNA            | 1            |
| Comedy         | 6            |
| Entertainment  | 6            |
| Music          | 5            |
| People         | 2            |
+----------------+--------------+--+
6 rows selected (79.887 seconds)

Categories of the videos related to the top 50 by heat:
0: jdbc:hive2://hadoop207.cevent.com:10000> select categories,count(1) hot50
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select video_id,categories
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select
0: jdbc:hive2://hadoop207.cevent.com:10000> distinct top50.video_id,
0: jdbc:hive2://hadoop207.cevent.com:10000> category
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select
0: jdbc:hive2://hadoop207.cevent.com:10000> explode(related_id) video_id
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select video_id,related_id,views from video_store order by views desc limit 50)
0: jdbc:hive2://hadoop207.cevent.com:10000> top5)
0: jdbc:hive2://hadoop207.cevent.com:10000> top50
0: jdbc:hive2://hadoop207.cevent.com:10000> left join video_store vs
0: jdbc:hive2://hadoop207.cevent.com:10000> on top50.video_id=vs.video_id)
0: jdbc:hive2://hadoop207.cevent.com:10000> top50s
0: jdbc:hive2://hadoop207.cevent.com:10000> lateral view explode(category) top50sc as categories)
0: jdbc:hive2://hadoop207.cevent.com:10000> tops
0: jdbc:hive2://hadoop207.cevent.com:10000> group by categories
0: jdbc:hive2://hadoop207.cevent.com:10000> order by hot50 desc;
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0003
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0003/
INFO : Starting Job = job_1591796204991_0003, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0003/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0003
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:15:13,852 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 22:15:26,287 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 4.82 sec
INFO : 2020-06-10 22:15:36,750 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 7.59 sec
INFO : MapReduce Total cumulative CPU time: 7 seconds 590 msec
INFO : Ended Job = job_1591796204991_0003
INFO : Stage-9 is selected by condition resolver.
INFO : Stage-2 is filtered out by condition resolver.
ERROR : Execution failed with exit status: 3
ERROR : Obtaining error information
ERROR :
Task failed!
Task ID:
  Stage-9
Logs:
ERROR : /opt/module/hive-1.2.1/logs/hive.log
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:2
INFO : Submitting tokens for job: job_1591796204991_0004
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0004/
INFO : Starting Job = job_1591796204991_0004, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0004/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0004
INFO : Hadoop job information for Stage-2: number of mappers: 2; number of reducers: 1
INFO : 2020-06-10 22:15:53,641 Stage-2 map = 0%, reduce = 0%
INFO : 2020-06-10 22:16:06,730 Stage-2 map = 50%, reduce = 0%, Cumulative CPU 1.26 sec
INFO : 2020-06-10 22:16:09,932 Stage-2 map = 100%, reduce = 0%, Cumulative CPU 6.23 sec
INFO : 2020-06-10 22:16:20,255 Stage-2 map = 100%, reduce = 100%, Cumulative CPU 11.0 sec
INFO : MapReduce Total cumulative CPU time: 11 seconds 0 msec
INFO : Ended Job = job_1591796204991_0004
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0005
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0005/
INFO : Starting Job = job_1591796204991_0005, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0005/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0005
INFO : Hadoop job information for Stage-3: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:16:33,666 Stage-3 map = 0%, reduce = 0%
INFO : 2020-06-10 22:16:39,909 Stage-3 map = 100%, reduce = 0%, Cumulative CPU 0.87 sec
INFO : 2020-06-10 22:16:45,066 Stage-3 map = 100%, reduce = 100%, Cumulative CPU 2.22 sec
INFO : MapReduce Total cumulative CPU time: 2 seconds 220 msec
INFO : Ended Job = job_1591796204991_0005
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0006
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0006/
INFO : Starting Job = job_1591796204991_0006, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0006/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0006
INFO : Hadoop job information for Stage-4: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:16:56,856 Stage-4 map = 0%, reduce = 0%
INFO : 2020-06-10 22:17:04,043 Stage-4 map = 100%, reduce = 0%, Cumulative CPU 1.2 sec
INFO : 2020-06-10 22:17:10,240 Stage-4 map = 100%, reduce = 100%, Cumulative CPU 2.52 sec
INFO : MapReduce Total cumulative CPU time: 2 seconds 520 msec
INFO : Ended Job = job_1591796204991_0006
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0007
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0007/
INFO : Starting Job = job_1591796204991_0007, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0007/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0007
INFO : Hadoop job information for Stage-5: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:17:22,760 Stage-5 map = 0%, reduce = 0%
INFO : 2020-06-10 22:17:31,863 Stage-5 map = 100%, reduce = 0%, Cumulative CPU 1.01 sec
INFO : 2020-06-10 22:17:38,056 Stage-5 map = 100%, reduce = 100%, Cumulative CPU 2.46 sec
INFO : MapReduce Total cumulative CPU time: 2 seconds 460 msec
INFO : Ended Job = job_1591796204991_0007
+----------------+--------+--+
|   categories   | hot50  |
+----------------+--------+--+
| Comedy         | 14     |
| Entertainment  | 11     |
| Music          | 10     |
| Film           | 3      |
| Animation      | 3      |
| People         | 2      |
| Blogs          | 2      |
| Travel         | 1      |
| Sports         | 1      |
| Howto          | 1      |
| Places         | 1      |
| DIY            | 1      |
+----------------+--------+--+
12 rows selected (156.518 seconds)
0: jdbc:hive2://hadoop207.cevent.com:10000> select categories,count(1) hot50
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select video_id,categories
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select
0: jdbc:hive2://hadoop207.cevent.com:10000> distinct top2.video_id,
0: jdbc:hive2://hadoop207.cevent.com:10000> category
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select
0: jdbc:hive2://hadoop207.cevent.com:10000> explode(related_id) video_id
0: jdbc:hive2://hadoop207.cevent.com:10000> from
0: jdbc:hive2://hadoop207.cevent.com:10000> (select video_id,related_id,views from video_store order by views desc limit 50)
0: jdbc:hive2://hadoop207.cevent.com:10000> top1)
0: jdbc:hive2://hadoop207.cevent.com:10000> top2
0: jdbc:hive2://hadoop207.cevent.com:10000> left join video_store vs
0: jdbc:hive2://hadoop207.cevent.com:10000> on top2.video_id=vs.video_id)
0: jdbc:hive2://hadoop207.cevent.com:10000> top3
0: jdbc:hive2://hadoop207.cevent.com:10000> lateral view explode(category) top50 as categories)
0: jdbc:hive2://hadoop207.cevent.com:10000> top4
0: jdbc:hive2://hadoop207.cevent.com:10000> group by categories
0: jdbc:hive2://hadoop207.cevent.com:10000> order by hot50 desc;
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0008
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0008/
INFO : Starting Job = job_1591796204991_0008, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0008/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0008
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:27:38,317 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 22:27:48,615 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 4.8 sec
INFO : 2020-06-10 22:27:57,877 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 7.66 sec
INFO : MapReduce Total cumulative CPU time: 7 seconds 660 msec
INFO : Ended Job = job_1591796204991_0008
INFO : Stage-9 is selected by condition resolver.
INFO : Stage-2 is filtered out by condition resolver.
ERROR : Execution failed with exit status: 3
ERROR : Obtaining error information
ERROR :
Task failed!
Task ID:
  Stage-9
Logs:
ERROR : /opt/module/hive-1.2.1/logs/hive.log
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:2
INFO : Submitting tokens for job: job_1591796204991_0009
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0009/
INFO : Starting Job = job_1591796204991_0009, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0009/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0009
INFO : Hadoop job information for Stage-2: number of mappers: 2; number of reducers: 1
INFO : 2020-06-10 22:28:16,085 Stage-2 map = 0%, reduce = 0%
INFO : 2020-06-10 22:28:27,280 Stage-2 map = 50%, reduce = 0%
INFO : 2020-06-10 22:28:32,046 Stage-2 map = 100%, reduce = 0%, Cumulative CPU 6.44 sec
INFO : 2020-06-10 22:28:43,275 Stage-2 map = 100%, reduce = 100%, Cumulative CPU 11.15 sec
INFO : MapReduce Total cumulative CPU time: 11 seconds 150 msec
INFO : Ended Job = job_1591796204991_0009
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0010
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0010/
INFO : Starting Job = job_1591796204991_0010, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0010/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0010
INFO : Hadoop job information for Stage-3: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:28:59,537 Stage-3 map = 0%, reduce = 0%
INFO : 2020-06-10 22:29:04,869 Stage-3 map = 100%, reduce = 0%, Cumulative CPU 0.99 sec
INFO : 2020-06-10 22:29:12,157 Stage-3 map = 100%, reduce = 100%, Cumulative CPU 2.56 sec
INFO : MapReduce Total cumulative CPU time: 2 seconds 560 msec
INFO : Ended Job = job_1591796204991_0010
INFO : Number of reduce tasks not specified. Estimated from input data size: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0011
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0011/
INFO : Starting Job = job_1591796204991_0011, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0011/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0011
INFO : Hadoop job information for Stage-4: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:29:24,044 Stage-4 map = 0%, reduce = 0%
INFO : 2020-06-10 22:29:29,179 Stage-4 map = 100%, reduce = 0%, Cumulative CPU 0.8 sec
INFO : 2020-06-10 22:29:36,872 Stage-4 map = 100%, reduce = 100%, Cumulative CPU 2.3 sec
INFO : MapReduce Total cumulative CPU time: 2 seconds 300 msec
INFO : Ended Job = job_1591796204991_0011
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0012
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0012/
INFO : Starting Job = job_1591796204991_0012, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0012/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0012
INFO : Hadoop job information for Stage-5: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:29:49,880 Stage-5 map = 0%, reduce = 0%
INFO : 2020-06-10 22:29:58,929 Stage-5 map = 100%, reduce = 0%, Cumulative CPU 0.87 sec
INFO : 2020-06-10 22:30:05,100 Stage-5 map = 100%, reduce = 100%, Cumulative CPU 2.23 sec
INFO : MapReduce Total cumulative CPU time: 2 seconds 230 msec
INFO : Ended Job = job_1591796204991_0012
+----------------+--------+--+
|   categories   | hot50  |
+----------------+--------+--+
| Comedy         | 14     |
| Entertainment  | 11     |
| Music          | 10     |
| Film           | 3      |
| Animation      | 3      |
| People         | 2      |
| Blogs          | 2      |
| Travel         | 1      |
| Sports         | 1      |
| Howto          | 1      |
| Places         | 1      |
| DIY            | 1      |
+----------------+--------+--+
12 rows selected (155.864 seconds)

Create the intermediate table:
0: jdbc:hive2://hadoop207.cevent.com:10000> create table video_center stored as orc as
0: jdbc:hive2://hadoop207.cevent.com:10000> select
0: jdbc:hive2://hadoop207.cevent.com:10000> video_id,
0: jdbc:hive2://hadoop207.cevent.com:10000> uploader,
0: jdbc:hive2://hadoop207.cevent.com:10000> age,
0: jdbc:hive2://hadoop207.cevent.com:10000> categories,
0: jdbc:hive2://hadoop207.cevent.com:10000> length,
0: jdbc:hive2://hadoop207.cevent.com:10000> views,
0: jdbc:hive2://hadoop207.cevent.com:10000> rate,
0: jdbc:hive2://hadoop207.cevent.com:10000> ratings,
0: jdbc:hive2://hadoop207.cevent.com:10000> comments,
0: jdbc:hive2://hadoop207.cevent.com:10000> related_id
0: jdbc:hive2://hadoop207.cevent.com:10000> from video_store
0: jdbc:hive2://hadoop207.cevent.com:10000> lateral view
0: jdbc:hive2://hadoop207.cevent.com:10000> explode(category) tb1 as categories;
INFO : Number of reduce tasks is set to 0 since there's no reduce operator
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0013
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0013/
INFO : Starting Job = job_1591796204991_0013, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0013/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0013
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 0
INFO : 2020-06-10 22:40:04,820 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 22:40:20,958 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 12.58 sec
INFO : MapReduce Total cumulative CPU time: 12 seconds 580 msec
INFO : Ended Job = job_1591796204991_0013
INFO : Stage-4 is selected by condition resolver.
INFO : Stage-3 is filtered out by condition resolver.
INFO : Stage-5 is filtered out by condition resolver.
INFO : Moving data to: hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_22-39-57_695_4121069996262157418-1/-ext-10001 from hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_22-39-57_695_4121069996262157418-1/-ext-10003
INFO : Moving data to: hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/video_center from hdfs://hadoop207.cevent.com:8020/user/hive/warehouse/cevent01.db/.hive-staging_hive_2020-06-10_22-39-57_695_4121069996262157418-1/-ext-10001
INFO : Table cevent01.video_center stats: [numFiles=1, numRows=1019206, totalSize=25757855, rawDataSize=405083036]
No rows affected (29.661 seconds)
0: jdbc:hive2://hadoop207.cevent.com:10000> select video_id,views
0: jdbc:hive2://hadoop207.cevent.com:10000> from video_center
0: jdbc:hive2://hadoop207.cevent.com:10000> where categories='music'
0: jdbc:hive2://hadoop207.cevent.com:10000> order by views desc
0: jdbc:hive2://hadoop207.cevent.com:10000> limit 10;
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0014
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0014/
INFO : Starting Job = job_1591796204991_0014, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0014/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0014
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:42:33,022 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 22:42:41,367 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 3.19 sec
INFO : 2020-06-10 22:42:47,540 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 4.46 sec
INFO : MapReduce Total cumulative CPU time: 4 seconds 460 msec
INFO : Ended Job = job_1591796204991_0014
+-----------+--------+--+
| video_id  | views  |
+-----------+--------+--+
+-----------+--------+--+
No rows selected (26.279 seconds)

Top 10 by heat within the category (retried with double quotes):
0: jdbc:hive2://hadoop207.cevent.com:10000> select video_id,views
0: jdbc:hive2://hadoop207.cevent.com:10000> from video_center
0: jdbc:hive2://hadoop207.cevent.com:10000> where categories="music"
0: jdbc:hive2://hadoop207.cevent.com:10000> order by views desc
0: jdbc:hive2://hadoop207.cevent.com:10000> limit 10;
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0015
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0015/
INFO : Starting Job = job_1591796204991_0015, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0015/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0015
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:43:24,251 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 22:43:33,219 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 2.89 sec
INFO : 2020-06-10 22:43:40,417 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 4.05 sec
INFO : MapReduce Total cumulative CPU time: 4 seconds 50 msec
INFO : Ended Job = job_1591796204991_0015
+-----------+--------+--+
| video_id  | views  |
+-----------+--------+--+
+-----------+--------+--+
No rows selected (25.851 seconds)
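Both attempts return zero rows: the category values stored in video_center are capitalized (the earlier category ranking shows "Music", "Comedy", and so on), so the lowercase predicate 'music' matches nothing. A minimal corrected sketch against the same table:

select video_id, views
from video_center
where categories = 'Music'   -- stored category values are capitalized
order by views desc
limit 10;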
Top 10 by traffic within the category:
0: jdbc:hive2://hadoop207.cevent.com:10000> select video_id,ratings
0: jdbc:hive2://hadoop207.cevent.com:10000> from video_center
0: jdbc:hive2://hadoop207.cevent.com:10000> where categories="music"
0: jdbc:hive2://hadoop207.cevent.com:10000> order by ratings desc
0: jdbc:hive2://hadoop207.cevent.com:10000> limit 10;
INFO : Number of reduce tasks determined at compile time: 1
INFO : In order to change the average load for a reducer (in bytes):
INFO : set hive.exec.reducers.bytes.per.reducer=<number>
INFO : In order to limit the maximum number of reducers:
INFO : set hive.exec.reducers.max=<number>
INFO : In order to set a constant number of reducers:
INFO : set mapreduce.job.reduces=<number>
INFO : number of splits:1
INFO : Submitting tokens for job: job_1591796204991_0016
INFO : The url to track the job: http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0016/
INFO : Starting Job = job_1591796204991_0016, Tracking URL = http://hadoop207.cevent.com:8088/proxy/application_1591796204991_0016/
INFO : Kill Command = /opt/module/hadoop-2.7.2/bin/hadoop job -kill job_1591796204991_0016
INFO : Hadoop job information for Stage-1: number of mappers: 1; number of reducers: 1
INFO : 2020-06-10 22:47:26,998 Stage-1 map = 0%, reduce = 0%
INFO : 2020-06-10 22:47:35,703 Stage-1 map = 100%, reduce = 0%, Cumulative CPU 2.96 sec
INFO : 2020-06-10 22:47:43,061 Stage-1 map = 100%, reduce = 100%, Cumulative CPU 4.18 sec
INFO : MapReduce Total cumulative CPU time: 4 seconds 180 msec
INFO : Ended Job = job_1591796204991_0016
+-----------+----------+--+
| video_id  | ratings  |
+-----------+----------+--+
+-----------+----------+--+
No rows selected (24.756 seconds)
-- ETL application
-- 1) Create the external user table:
create external table video_user_info(
uploader string,
videos int,
friends int
)
row format delimited fields terminated by '\t'
location '/cevent_video_show/user';

select * from video_user_info limit 5;

-- 2) Create the external video table:
create external table video_info(
video_id string,
uploader string,
age int,
category array<string>,
length int,
views int,
rate float,
ratings int,
comments int,
related_id array<string>
)
row format delimited fields terminated by '\t'
collection items terminated by '&'
location '/cevent_video_show/video';

select * from video_info limit 5;

-- 3) Create managed tables and load the external-table data into them
create table video_user stored as orc as select * from video_user_info;
create table video_store stored as orc as select * from video_info;

-- Queries --
-- 1. Top 10 videos by view count
select * from video_info order by views desc limit 10;

-- 2. Top 10 video categories by heat (view count)
-- lateral view explode unnests the category array into one row per category (alias vtb1)
select video_id,views,categories
from video_info
lateral view explode(category) vtb1 as categories;
-- wrap the exploded rows as vtb2, then aggregate over the unnested column
select categories,sum(views) hot_view
from
(
select video_id,views,categories
from video_info
lateral view explode(category) vtb1 as categories
) vtb2
group by categories
order by hot_view desc
limit 10;

-- 3. Top 20 videos by view count: show their categories and how many of the 20 each category contains
-- top1: the 20 most-viewed videos
select video_id,category,views from video_store order by views desc limit 20;
-- explode top1's categories
select video_id,categories
from
(select video_id,category,views from video_store order by views desc limit 20) top1
lateral view explode(category) topclass as categories;
-- top2: count per category
select categories,count(1) count_views
from
(select video_id,categories
from
(select video_id,category,views from video_store order by views desc limit 20) top1
lateral view explode(category) topclass as categories) top2
group by categories;

-- 4. Categories of the videos related to the top 50 most-viewed videos, ranked by count
-- the top 50 by views, with their related ids
select video_id,related_id,views from video_store order by views desc limit 50;
-- top1: explode the related ids; since the input is already limited to well under
-- 10,000 rows, a global distinct is affordable, though strict mode may disallow it
select
explode(related_id) video_id
from
(select video_id,related_id,views from video_store order by views desc limit 50) top1;
-- top2: join back to the full table to look up each related video's categories
select
distinct top2.video_id,
category
from
(select
explode(related_id) video_id
from
(select video_id,related_id,views from video_store order by views desc limit 50) top1) top2
left join video_store vs
on top2.video_id=vs.video_id;
-- top3: explode the categories
select video_id,categories
from
(select
distinct top2.video_id,
category
from
(select
explode(related_id) video_id
from
(select video_id,related_id,views from video_store order by views desc limit 50) top1) top2
left join video_store vs
on top2.video_id=vs.video_id) top3
lateral view explode(category) top50 as categories;
-- top4: count per category and rank
select categories,count(1) hot50
from
(select video_id,categories
from
(select
distinct top2.video_id,
category
from
(select
explode(related_id) video_id
from
(select video_id,related_id,views from video_store order by views desc limit 50) top1) top2
left join video_store vs
on top2.video_id=vs.video_id) top3
lateral view explode(category) top50 as categories) top4
group by categories
order by hot50 desc;

-- 5. Top 10 videos by heat within a category, taking Music as the example
-- create the intermediate table (the CTAS select below is also the query that feeds it)
create table video_center stored as orc as
select
video_id,
uploader,
age,
categories,
length,
views,
rate,
ratings,
comments,
related_id
from video_store
lateral view
explode(category) tb1 as categories;
-- rank by heat; note the stored category values are capitalized, so 'Music' (not 'music') matches
select video_id,views
from video_center
where categories="Music"
order by views desc
limit 10;

-- 6. Top 10 videos by traffic (ratings) within a category, Music as the example
select video_id,ratings
from video_center
where categories="Music"
order by ratings desc
limit 10;
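Queries 5 and 6 take Music as the example category. To get a per-category top 10 for every category in a single statement, a minimal sketch using Hive's windowing functions (available since Hive 0.11, so usable on this 1.2.1 setup; table and column names as above):

-- rank videos inside each category by views, then keep the top 10 per category
select categories, video_id, views
from
(select categories, video_id, views,
rank() over (partition by categories order by views desc) rk
from video_center) ranked
where rk <= 10;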