========================================================================================================================================================================================================================================================================
1.2复合指标统计分析
--统计今日所有来访者平均请求的页面数。
--平均每个独立访客一天内访问网站的次数(产生的session个数)。
========================================================================================================================================================================================================================================================================
--需求描述:统计今日所有来访者平均请求的页面数。
--总页面请求数pv/去重总人数uv
-- (Re)create the result table for the daily "average page views per visitor" metric.
-- IF EXISTS lets the script run on a fresh warehouse where the table has never been created.
-- The describe statement runs after the create; right after the drop there is nothing to describe.
-- NOTE(review): avgv holds a numeric ratio but is declared as string; kept unchanged for
-- compatibility with existing readers -- consider double.
drop table if exists dw_avgpv_user_everyday;
create table dw_avgpv_user_everyday(day string,avgv string);
desc dw_avgpv_user_everyday;
---:方式一(统计今日所有来访者平均请求的页面数。)
-- Preview the daily traffic summary table; the sample output below lists
-- month, day, pv, uv, ip, vv and datestr.
select *
from dw_webflow_basic_info;
+------------------------------+----------------------------+---------------------------+---------------------------+---------------------------+---------------------------+--------------------------------+--+
| dw_webflow_basic_info.month | dw_webflow_basic_info.day | dw_webflow_basic_info.pv | dw_webflow_basic_info.uv | dw_webflow_basic_info.ip | dw_webflow_basic_info.vv | dw_webflow_basic_info.datestr |
+------------------------------+----------------------------+---------------------------+---------------------------+---------------------------+---------------------------+--------------------------------+--+
| 201811 | 01 | 27540 | 1027 | 1027 | 57 | 20181101 |
+------------------------------+----------------------------+---------------------------+---------------------------+---------------------------+---------------------------+--------------------------------+--+
-- Average pages requested per visitor: total page views (pv) / distinct visitors (uv).
-- Filtered to a single datestr so the result stays one row once the summary table
-- holds more than one day (the other summary lookups in this file filter the same way).
select pv/uv as avgv
from dw_webflow_basic_info
where datestr='20181101';
+---------------------+--+
| avgv |
+---------------------+--+
| 26.815968841285297 |
+---------------------+--+
---:方式二 (统计今日所有来访者平均请求的页面数。)
-- Look at five rows of the detailed access-log table to see its columns.
select *
from dw_weblog_detail
limit 5;
+-------------------------+-------------------------------+-------------------------------+------------------------------+--------------------------+---------------------------+-------------------------+-----------------------+------------------------+-----------------------------------------------+--------------------------+-----------------------------------+--------------------------------+----------------------------+----------------------------+-----------------------------+--------------------------------+-----------------------------------+---------------------------+--+
| dw_weblog_detail.valid | dw_weblog_detail.remote_addr | dw_weblog_detail.remote_user | dw_weblog_detail.time_local | dw_weblog_detail.daystr | dw_weblog_detail.timestr | dw_weblog_detail.month | dw_weblog_detail.day | dw_weblog_detail.hour | dw_weblog_detail.request | dw_weblog_detail.status | dw_weblog_detail.body_bytes_sent | dw_weblog_detail.http_referer | dw_weblog_detail.ref_host | dw_weblog_detail.ref_path | dw_weblog_detail.ref_query | dw_weblog_detail.ref_query_id | dw_weblog_detail.http_user_agent | dw_weblog_detail.datestr |
+-------------------------+-------------------------------+-------------------------------+------------------------------+--------------------------+---------------------------+-------------------------+-----------------------+------------------------+-----------------------------------------------+--------------------------+-----------------------------------+--------------------------------+----------------------------+----------------------------+-----------------------------+--------------------------------+-----------------------------------+---------------------------+--+
| false | 194.237.142.21 | - | 2018-11-01 06:49:18 | 2018-11-01 | 06:49:18 | 11 | 01 | 06 | /wp-content/uploads/2013/07/rstudio-git3.png | 304 | 0 | "-" | NULL | NULL | NULL | NULL | "Mozilla/4.0(compatible;)" | 20181101 |
| false | 163.177.71.12 | - | 2018-11-01 06:49:33 | 2018-11-01 | 06:49:33 | 11 | 01 | 06 | / | 200 | 20 | "-" | NULL | NULL | NULL | NULL | "DNSPod-Monitor/1.0" | 20181101 |
| false | 163.177.71.12 | - | 2018-11-01 06:49:36 | 2018-11-01 | 06:49:36 | 11 | 01 | 06 | / | 200 | 20 | "-" | NULL | NULL | NULL | NULL | "DNSPod-Monitor/1.0" | 20181101 |
| false | 101.226.68.137 | - | 2018-11-01 06:49:42 | 2018-11-01 | 06:49:42 | 11 | 01 | 06 | / | 200 | 20 | "-" | NULL | NULL | NULL | NULL | "DNSPod-Monitor/1.0" | 20181101 |
| false | 101.226.68.137 | - | 2018-11-01 06:49:45 | 2018-11-01 | 06:49:45 | 11 | 01 | 06 | / | 200 | 20 | "-" | NULL | NULL | NULL | NULL | "DNSPod-Monitor/1.0" | 20181101 |
+-------------------------+-------------------------------+-------------------------------+------------------------------+--------------------------+---------------------------+-------------------------+-----------------------+------------------------+-----------------------------------------------+--------------------------+-----------------------------------+--------------------------------+----------------------------+----------------------------+-----------------------------+--------------------------------+-----------------------------------+---------------------------+--+
-- Request count per client address for datestr 20181101 (only five groups shown).
select
    remote_addr,
    count(1) as pvs
from dw_weblog_detail
where datestr = '20181101'
group by remote_addr
limit 5;
+----------------+------+--+
| remote_addr | pvs |
+----------------+------+--+
| 1.162.203.134 | 2 |
| 1.202.186.37 | 70 |
| 1.202.222.147 | 2 |
| 1.202.70.78 | 2 |
| 1.206.126.5 | 68 |
+----------------+------+--+
-- Average page views per visitor for datestr 20181101, computed from the detail rows:
-- the inner query counts requests per remote_addr, the outer query divides the
-- summed counts by the number of addresses.
select
    '20181101',
    sum(per_addr.pvs) / count(per_addr.remote_addr)
from (
    select
        remote_addr,
        count(1) as pvs
    from dw_weblog_detail
    where datestr = '20181101'
    group by remote_addr
) per_addr;
+-----------+---------------------+--+
| _c0 | _c1 |
+-----------+---------------------+--+
| 20181101 | 26.815968841285297 |
+-----------+---------------------+--+
-- Store the day's average page views per visitor in dw_avgpv_user_everyday.
-- INSERT INTO appends, so running this statement again adds another row for the same day.
insert into table dw_avgpv_user_everyday
select
    '20181101',
    sum(per_addr.pvs) / count(per_addr.remote_addr)
from (
    select
        remote_addr,
        count(1) as pvs
    from dw_weblog_detail
    where datestr = '20181101'
    group by remote_addr
) per_addr;
-- Read the result table back to confirm the inserted row.
select *
from dw_avgpv_user_everyday
limit 5;
+-----------------------------+------------------------------+--+
| dw_avgpv_user_everyday.day | dw_avgpv_user_everyday.avgv |
+-----------------------------+------------------------------+--+
| 20181101 | 26.815968841285297 |
+-----------------------------+------------------------------+--+
平均访问频度(Average Access Frequency)
--平均每个独立访客一天内访问网站的次数(产生的session个数)。
--计算方式:访问次数vv/独立访客数uv
方式一:表(dw_webflow_basic_info)--平均每个独立访客一天内访问网站的次数(产生的session个数)。
-- Show the daily summary row(s) that provide vv (visits) and uv (distinct visitors).
select *
from dw_webflow_basic_info;
+------------------------------+----------------------------+---------------------------+---------------------------+---------------------------+---------------------------+--------------------------------+--+
| dw_webflow_basic_info.month | dw_webflow_basic_info.day | dw_webflow_basic_info.pv | dw_webflow_basic_info.uv | dw_webflow_basic_info.ip | dw_webflow_basic_info.vv | dw_webflow_basic_info.datestr |
+------------------------------+----------------------------+---------------------------+---------------------------+---------------------------+---------------------------+--------------------------------+--+
| 201811 | 01 | 27540 | 1027 | 1027 | 57 | 20181101 |
+------------------------------+----------------------------+---------------------------+---------------------------+---------------------------+---------------------------+--------------------------------+--+
--注意vv的计算采用的是点击流模型表数据 已经去除无效数据
-- Average access frequency: visits (vv) / distinct visitors (uv) from the daily summary table.
-- Open question raised by Chen Yanlong (originally a bare note after the semicolon, which is
-- not valid SQL): the recorded result is about 0.0555, i.e. fewer than one session per visitor.
-- vv is computed from the click-stream model tables with invalid rows removed, so it is
-- presumably not comparable with this uv -- TODO confirm how uv is populated.
-- Filtered to one datestr so the result stays a single row when more days are loaded.
select vv/uv as Average_access_frequency
from dw_webflow_basic_info
where datestr='20181101';
+---------------------------+--+
| average_access_frequency |
+---------------------------+--+
| 0.055501460564751706 |
+---------------------------+--+
方式二:表(ods_click_stream_visit)--平均每个独立访客一天内访问网站的次数(产生的session个数)。
--ods_click_pageviews
--ods_click_stream_visit
-- Preview ten rows of the visit table.
select *
from ods_click_stream_visit
limit 10;
+---------------------------------------+-------------------------------------+--------------------------------+---------------------------------+--------------------------------+---------------------------------+----------------------------------------------------+------------------------------------+---------------------------------+--+
| ods_click_stream_visit.session | ods_click_stream_visit.remote_addr | ods_click_stream_visit.intime | ods_click_stream_visit.outtime | ods_click_stream_visit.inpage | ods_click_stream_visit.outpage | ods_click_stream_visit.referal | ods_click_stream_visit.pagevisits | ods_click_stream_visit.datestr |
+---------------------------------------+-------------------------------------+--------------------------------+---------------------------------+--------------------------------+---------------------------------+----------------------------------------------------+------------------------------------+---------------------------------+--+
| 005fd135-d9ec-4ac2-ba16-706004359d42 | 195.110.138.105 | 2018-11-01 19:10:52 | 2018-11-01 19:10:52 | /cassandra-clustor/ | /cassandra-clustor/ | "https://www.google.com.tw/" | 1 | 20181101 |
| 00a9e4d8-dfb2-4d32-b180-eb2383112317 | 66.249.66.84 | 2018-11-01 07:44:41 | 2018-11-01 07:44:41 | /finance-rhive-repurchase/ | /finance-rhive-repurchase/ | "-" | 1 | 20181101 |
| 0173589c-2fbb-4d60-ad65-44d7468ec0ab | 159.226.251.170 | 2018-11-01 08:26:18 | 2018-11-01 08:26:18 | /hadoop-mahout-roadmap/ | /hadoop-mahout-roadmap/ | "http://f.dataguru.cn/thread-177375-1-1.html" | 1 | 20181101 |
| 065d5e7a-d7fe-45a3-b7b4-a5f053ecc4ab | 221.179.193.202 | 2018-11-02 00:44:07 | 2018-11-02 00:44:07 | /hadoop-mahout-roadmap/ | /hadoop-mahout-roadmap/ | "-" | 1 | 20181101 |
| 14c9ea27-dd75-476e-bea4-7f01d9ee4953 | 218.18.232.228 | 2018-11-01 09:53:55 | 2018-11-01 09:53:55 | /hadoop-family-roadmap/ | /hadoop-family-roadmap/ | "https://www.google.com.hk/" | 1 | 20181101 |
| 165938d8-2c27-4c57-b1e7-613a28d2f1d6 | 113.90.48.158 | 2018-11-01 23:19:41 | 2018-11-01 23:19:41 | /finance-rhive-repurchase/ | /finance-rhive-repurchase/ | "http://blog.fens.me/series-it-finance/" | 1 | 20181101 |
| 1784f12d-0b49-4c0e-b7e4-93dc39883091 | 123.116.73.157 | 2018-11-02 00:58:58 | 2018-11-02 00:58:58 | /hadoop-zookeeper-intro/ | /hadoop-zookeeper-intro/ | "https://www.google.com.hk/" | 1 | 20181101 |
| 182549fa-aca2-49ea-88ce-6aa238bbf1dd | 110.211.10.14 | 2018-11-01 13:31:10 | 2018-11-01 13:31:10 | /hadoop-mahout-roadmap/ | /hadoop-mahout-roadmap/ | "http://f.dataguru.cn/forum.php?mod=viewthread&tid=175501" | 1 | 20181101 |
| 1ba35571-d9c0-4b26-bcd0-4999e395ae7f | 183.60.9.217 | 2018-11-01 07:10:57 | 2018-11-01 07:10:57 | /hadoop-hive-intro/ | /hadoop-hive-intro/ | "-" | 1 | 20181101 |
| 1d5dec98-637b-45f1-9ada-58ae4fff7a9b | 112.65.193.16 | 2018-11-01 08:48:31 | 2018-11-01 08:48:31 | /hadoop-mahout-roadmap/ | /hadoop-mahout-roadmap/ | "-" | 1 | 20181101 |
+---------------------------------------+-------------------------------------+--------------------------------+---------------------------------+--------------------------------+---------------------------------+----------------------------------------------------+------------------------------------+---------------------------------+--+
--符合逻辑
-- Sessions per distinct client address for datestr 20181101, taken from the visit table
-- (which appears to hold one row per session -- its row count equals vv in the summary).
select
    count(session) / count(distinct remote_addr) as Average_access_frequency
from ods_click_stream_visit
where datestr = '20181101';
+---------------------------+--+
| average_access_frequency |
+---------------------------+--+
| 1.0754716981132075 |
+---------------------------+--+
-- Preview ten rows of the page-view table.
select *
from ods_click_pageviews
limit 10;
+---------------------------------------+----------------------------------+----------------------------------+---------------------------------+------------------------------+---------------------------------+------------------------------------+----------------------------------------------------+----------------------------------------------------+--------------------------------------+-----------------------------+------------------------------+--+
| ods_click_pageviews.session | ods_click_pageviews.remote_addr | ods_click_pageviews.remote_user | ods_click_pageviews.time_local | ods_click_pageviews.request | ods_click_pageviews.visit_step | ods_click_pageviews.page_staylong | ods_click_pageviews.http_referer | ods_click_pageviews.http_user_agent | ods_click_pageviews.body_bytes_sent | ods_click_pageviews.status | ods_click_pageviews.datestr |
+---------------------------------------+----------------------------------+----------------------------------+---------------------------------+------------------------------+---------------------------------+------------------------------------+----------------------------------------------------+----------------------------------------------------+--------------------------------------+-----------------------------+------------------------------+--+
| 7e81b5a1-8b54-437a-ab29-51b215b14fa9 | 1.80.249.223 | - | 2018-11-01 07:57:33 | /hadoop-hive-intro/ | 1 | 60 | "http://www.google.com.hk/url?sa=t&rct=j&q=hive%E7%9A%84%E5%AE%89%E8%A3%85&source=web&cd=2&ved=0CC4QFjAB&url=%68%74%74%70%3a%2f%2f%62%6c%6f%67%2e%66%65%6e%73%2e%6d%65%2f%68%61%64%6f%6f%70%2d%68%69%76%65%2d%69%6e%74%72%6f%2f&ei=5lw5Uo-2NpGZiQfCwoG4BA&usg=AFQjCNF8EFxPuCMrm7CvqVgzcBUzrJZStQ&bvm=bv.52164340,d.aGc&cad=rjt" | "Mozilla/5.0(WindowsNT5.2;rv:23.0)Gecko/20100101Firefox/23.0" | 14764 | 200 | 20181101 |
| 5ec73e05-f291-4996-b2d1-13f15cd8331c | 101.226.167.201 | - | 2018-11-01 09:30:36 | /hadoop-mahout-roadmap/ | 1 | 60 | "http://blog.fens.me/hadoop-mahout-roadmap/" | "Mozilla/4.0(compatible;MSIE8.0;WindowsNT6.1;Trident/4.0;SLCC2;.NETCLR2.0.50727;.NETCLR3.5.30729;.NETCLR3.0.30729;MediaCenterPC6.0;MDDR;.NET4.0C;.NET4.0E;.NETCLR1.1.4322;TabletPC2.0);360Spider" | 10335 | 200 | 20181101 |
| fb2c9ed1-09c0-442b-8903-5132b46250ba | 101.226.167.205 | - | 2018-11-01 09:30:32 | /hadoop-family-roadmap/ | 1 | 60 | "http://blog.fens.me/hadoop-family-roadmap/" | "Mozilla/4.0(compatible;MSIE8.0;WindowsNT6.1;Trident/4.0;SLCC2;.NETCLR2.0.50727;.NETCLR3.5.30729;.NETCLR3.0.30729;MediaCenterPC6.0;MDDR;.NET4.0C;.NET4.0E;.NETCLR1.1.4322;TabletPC2.0);360Spider" | 11715 | 200 | 20181101 |
| 6cf55c75-47b8-425a-83d1-8efc8c94e518 | 101.226.169.215 | - | 2018-11-01 10:07:31 | /about | 1 | 60 | "http://blog.fens.me/about" | "Mozilla/4.0(compatible;MSIE8.0;WindowsNT6.1;Trident/4.0;SLCC2;.NETCLR2.0.50727;.NETCLR3.5.30729;.NETCLR3.0.30729;MediaCenterPC6.0;MDDR;.NET4.0C;.NET4.0E;.NETCLR1.1.4322;TabletPC2.0);360Spider" | 5 | 301 | 20181101 |
| 182549fa-aca2-49ea-88ce-6aa238bbf1dd | 110.211.10.14 | - | 2018-11-01 13:31:10 | /hadoop-mahout-roadmap/ | 1 | 60 | "http://f.dataguru.cn/forum.php?mod=viewthread&tid=175501" | "Mozilla/4.0(compatible;MSIE8.0;WindowsNT6.1;WOW64;Trident/4.0;SLCC2;.NETCLR2.0.50727;.NETCLR3.5.30729;.NETCLR3.0.30729;MALN;InfoPath.2;.NET4.0C;MediaCenterPC6.0)" | 10335 | 200 | 20181101 |
| 53cd20ab-c17e-457b-af60-a385f847959a | 111.161.17.104 | - | 2018-11-01 12:17:25 | /hadoop-hive-intro/ | 1 | 60 | "http://blog.fens.me/series-hadoop-cloud/" | "Mozilla/5.0(WindowsNT6.2;WOW64)AppleWebKit/537.36(KHTML,likeGecko)Chrome/29.0.1547.66Safari/537.36" | 14763 | 200 | 20181101 |
| a7b62caf-f8bd-4ab8-a894-b66b12f8dc80 | 111.193.224.9 | - | 2018-11-01 07:17:25 | /hadoop-family-roadmap/ | 1 | 60 | "https://www.google.com.hk/" | "Mozilla/5.0(Macintosh;IntelMacOSX10_8_5)AppleWebKit/537.36(KHTML,likeGecko)Chrome/29.0.1547.57Safari/537.36" | 11715 | 200 | 20181101 |
| 1d5dec98-637b-45f1-9ada-58ae4fff7a9b | 112.65.193.16 | - | 2018-11-01 08:48:31 | /hadoop-mahout-roadmap/ | 1 | 60 | "-" | "Mozilla/4.0" | 38590 | 200 | 20181101 |
| ef5ce8f8-a505-49f0-8aad-ac20d49e2e18 | 113.107.237.31 | - | 2018-11-01 09:06:46 | /finance-rhive-repurchase/ | 1 | 60 | "-" | "-" | 45271 | 200 | 20181101 |
| 723d9fd4-851d-46a7-bb96-e3735889097f | 113.90.232.163 | - | 2018-11-02 00:58:00 | /hadoop-mahout-roadmap/ | 1 | 60 | "http://h2w.iask.cn/jump.php?url=http%3A%2F%2Fblog.fens.me%2Fhadoop-mahout-roadmap%2F" | "Mozilla/5.0(iPhone;CPUiPhoneOS6_0_1likeMacOSX)AppleWebKit/536.26(KHTML,likeGecko)Mobile/10A523" | 10321 | 200 | 20181101 |
+---------------------------------------+----------------------------------+----------------------------------+---------------------------------+------------------------------+---------------------------------+------------------------------------+----------------------------------------------------+----------------------------------------------------+--------------------------------------+-----------------------------+------------------------------+--+
--不符合逻辑:ods_click_pageviews 每行是一次页面访问,count(session) 统计的是页面访问记录数而不是会话数(见下方验证)
-- Same ratio computed on the page-view table. count(session) counts every page-view row,
-- so a session with several page views is counted more than once; this is why the result
-- differs from the visit-table figure (see the distinct-session check further down).
select
    count(session) / count(distinct remote_addr) as Average_access_frequency
from ods_click_pageviews
where datestr = '20181101';
+---------------------------+--+
| average_access_frequency |
+---------------------------+--+
| 1.4339622641509433 |
+---------------------------+--+
ods_click_pageviews:1.4339622641509433
ods_click_stream_visit:1.0754716981132075
为什么不相等?推测原因:ods_click_pageviews 中同一个 session 对应多条页面访问记录,count(session) 把重复的 session 也计入了。
验证:
-- Verification: count each session once, then divide by the number of distinct addresses.
select
    count(distinct session) / count(distinct remote_addr) as Average_access_frequency
from ods_click_pageviews
where datestr = '20181101';
+---------------------------+--+
| average_access_frequency |
+---------------------------+--+
| 1.0754716981132075 |
+---------------------------+--+
测试结果ok
平均访问时长
--平均每次访问(会话)在网站上的停留时间。
--体现网站对访客的吸引程度。
--平均访问时长=访问总时长/访问次数。
先计算每次会话的停留时长
page_staylong
-- Total stay time per session: page_staylong summed over the session's page views.
select
    session,
    sum(page_staylong) as web_staylong
from ods_click_pageviews
where datestr = '20181101'
group by session;
+---------------------------------------+---------------+--+
| session | web_staylong |
+---------------------------------------+---------------+--+
| 005fd135-d9ec-4ac2-ba16-706004359d42 | 60.0 |
| 00a9e4d8-dfb2-4d32-b180-eb2383112317 | 60.0 |
| 0173589c-2fbb-4d60-ad65-44d7468ec0ab | 60.0 |
| 065d5e7a-d7fe-45a3-b7b4-a5f053ecc4ab | 60.0 |
| 14c9ea27-dd75-476e-bea4-7f01d9ee4953 | 60.0 |
| 165938d8-2c27-4c57-b1e7-613a28d2f1d6 | 60.0 |
| 1784f12d-0b49-4c0e-b7e4-93dc39883091 | 60.0 |
| 182549fa-aca2-49ea-88ce-6aa238bbf1dd | 60.0 |
| 1ba35571-d9c0-4b26-bcd0-4999e395ae7f | 60.0 |
| 1d5dec98-637b-45f1-9ada-58ae4fff7a9b | 60.0 |
| 2899e25e-1f1b-4980-93e7-213b8beaee56 | 60.0 |
| 345a33da-e6a4-427f-bb53-c94dd42a9fa0 | 60.0 |
| 34a827ac-f52d-48ff-8779-29888ad22127 | 60.0 |
| 34f2bc2b-b33d-4c74-b4bf-992bb141f725 | 60.0 |
| 3e390e3e-6989-4432-9ecb-a951ba565a02 | 60.0 |
| 45aa2afd-db94-4be7-b14d-81c92d84817e | 60.0 |
| 4e2dc5f8-ab8d-4458-9867-75079360c716 | 333.0 |
| 4ffcf9e0-4384-46c7-8b24-4501e3dd388c | 60.0 |
| 53cd20ab-c17e-457b-af60-a385f847959a | 60.0 |
| 54e8d444-28a4-483c-81bb-1ebbf6934992 | 60.0 |
| 5a27951d-7413-4690-889f-09d358a6fc36 | 1303.0 |
| 5ec73e05-f291-4996-b2d1-13f15cd8331c | 60.0 |
| 64bd4724-7d02-437b-a157-a936e6461b24 | 1441.0 |
| 651052ed-baa4-42c6-b090-374d111b332c | 60.0 |
| 657e0608-5dac-4d1b-a2dd-83bd2ff3e2bc | 182.0 |
| 6623086d-dda5-4e18-a455-ac318b575158 | 60.0 |
| 6b4aa305-25ee-4b4a-bd25-4faa3c426c0e | 60.0 |
| 6b633951-59ee-4e21-9220-c6b0527c2280 | 111.0 |
| 6cf55c75-47b8-425a-83d1-8efc8c94e518 | 60.0 |
| 6d60b7e3-581f-4a03-8170-c858811f3370 | 60.0 |
| 6da248b7-a9f0-4966-a2d8-87b4c0e40ee1 | 60.0 |
| 723d9fd4-851d-46a7-bb96-e3735889097f | 60.0 |
| 7e81b5a1-8b54-437a-ab29-51b215b14fa9 | 60.0 |
| 7efdf5c0-3ffb-41e3-adcc-4a35d1f730a6 | 60.0 |
| 965e0160-9edb-4df8-a1d4-52410f4b7b74 | 60.0 |
| 990213f7-d999-47f3-bddc-304753fed7e4 | 629.0 |
| 9c02530f-8e52-4134-a925-bdef9abbbcde | 1668.0 |
| a7422b4f-2b63-47d8-b01b-b74ff8dca107 | 60.0 |
| a763ba11-b541-43e0-9447-6f184dbb56d2 | 61.0 |
| a7b62caf-f8bd-4ab8-a894-b66b12f8dc80 | 60.0 |
| af0c8899-fe97-4ed2-85ff-27941d4ec965 | 60.0 |
| b2a36031-1960-4175-87e1-143bc4ce7ea1 | 60.0 |
| b3925600-7533-4f52-9959-16b72f71c3fb | 60.0 |
| bc0189d0-210c-4edd-98ca-d6d4528682c8 | 60.0 |
| bc72c9ea-8bc3-48a9-8bc4-4b96742bbb3b | 1606.0 |
| c25c79a9-94b8-4d5c-a245-262c32373e55 | 60.0 |
| c92e4fb1-ecc1-4765-9ce2-08c5c6e0df66 | 60.0 |
| cff0ae91-c947-41bc-8684-eeee36a1b45e | 60.0 |
| d53726e9-23cd-4709-a2b9-556833683646 | 1535.0 |
| d6504de9-49e9-4784-bf4e-3d1a0019d642 | 60.0 |
| dc8ebf30-cb6d-47ab-9b19-d6b2b0379efa | 60.0 |
| e941709a-289a-401f-b892-a3b1a8f03399 | 60.0 |
| ee501555-6ff3-4be1-b35b-1f299705988e | 60.0 |
| eeac30bd-8a78-4f0e-af34-8a5ab02509cf | 60.0 |
| ef5ce8f8-a505-49f0-8aad-ac20d49e2e18 | 60.0 |
| f0c4a0a1-c683-478e-a627-b754a161db58 | 412.0 |
| fb2c9ed1-09c0-442b-8903-5132b46250ba | 60.0 |
+---------------------------------------+---------------+--+
计算平均访问时长
-- Average visit duration: total stay time across all sessions / number of sessions.
-- The inner query yields one row per session with its summed page_staylong.
select
    sum(per_session.web_staylong) / count(per_session.session)
from (
    select
        session,
        sum(page_staylong) as web_staylong
    from ods_click_pageviews
    where datestr = '20181101'
    group by session
) per_session;
+---------------------+--+
| _c0 |
+---------------------+--+
| 211.24561403508773 |
+---------------------+--+
1 row selected (61.213 seconds)
--注意:sum 是对数值求和,count 是统计(非空)记录的条数
跳出率
--跳出率是指用户到网站上仅浏览了一个页面就离开的访问次数与所有访问次数的百分比。
--是评价网站性能的重要指标。
/hadoop-mahout-roadmap/ 页面跳出率
-- Number of rows in the visit table for datestr 20181101 (the denominator of the bounce rate).
select count(1)
from ods_click_stream_visit
where datestr = '20181101';
+------+--+
| _c0 |
+------+--+
| 57 |
+------+--+
1 row selected (30.667 seconds)
-- Cross-check: the summary table's vv for the same day.
select vv
from dw_webflow_basic_info
where datestr = '20181101';
+-----+--+
| vv |
+-----+--+
| 57 |
+-----+--+
1 row selected (0.119 seconds)
只浏览了 /hadoop-mahout-roadmap/ 一个页面就离开的访问次数(会话数)
-- Visits on datestr 20181101 that viewed exactly one page and left from /hadoop-mahout-roadmap/.
-- The count is aliased as nums so the header matches the recorded output and the
-- subquery used in the combined bounce-rate statement.
select count(*) as nums
from ods_click_stream_visit
where datestr = '20181101'
  and pagevisits = 1
  and outpage = '/hadoop-mahout-roadmap/';
+-------+--+
| nums |
+-------+--+
| 11 |
+-------+--+
1 row selected (30.299 seconds)
合并计算结果:
-- Bounce rate (percent) for /hadoop-mahout-roadmap/ on datestr 20181101:
-- single-page visits that left from that page / total visits (vv) of the same day.
-- The summary table is filtered to the same datestr; without the filter the one-row
-- bounce count would be paired with every day stored in dw_webflow_basic_info.
-- The pairing is a deliberate cross join of two single-row inputs, written explicitly.
-- NOTE(review): the denominator is all visits of the site, not only visits that entered
-- on this page -- confirm this is the intended definition of a per-page bounce rate.
select
    (b.nums/a.vv)*100
from dw_webflow_basic_info a
cross join (
    select count(*) as nums
    from ods_click_stream_visit
    where datestr = '20181101'
      and pagevisits = 1
      and outpage = '/hadoop-mahout-roadmap/'
) b
where a.datestr = '20181101';
+---------------------+--+
| _c0 |
+---------------------+--+
| 19.298245614035086 |
+---------------------+--+
1 row selected (58.57 seconds)