5 years ago · 09e846ed77
--- a/.gitignore
+++ b/.gitignore
@@ -0,0 +1,7 @@
 
																+.idea/
															
 
																+/out/
															
 
																+*/__pycache__/
															
 
																+/venv/
															
 
																+/全部户型-镜像/*
															
 
																+/algorithm/file/
															
 
																+/resources/need_finish_files/*
															
--- a/__pycache__/excel_util.cpython-36.pyc
+++ b/__pycache__/excel_util.cpython-36.pyc
--- a/__pycache__/excel_util.cpython-37.pyc
+++ b/__pycache__/excel_util.cpython-37.pyc
--- a/__pycache__/flask_app.cpython-36.pyc
+++ b/__pycache__/flask_app.cpython-36.pyc
--- a/__pycache__/mvp.cpython-36.pyc
+++ b/__pycache__/mvp.cpython-36.pyc
--- a/__pycache__/mvp.cpython-37.pyc
+++ b/__pycache__/mvp.cpython-37.pyc
--- a/__pycache__/mysql_db.cpython-36.pyc
+++ b/__pycache__/mysql_db.cpython-36.pyc
--- a/__pycache__/mysql_db.cpython-37.pyc
+++ b/__pycache__/mysql_db.cpython-37.pyc
--- a/db/__pycache__/mysql_db.cpython-37.pyc
+++ b/db/__pycache__/mysql_db.cpython-37.pyc
--- a/utils/excel_util.py
+++ b/utils/excel_util.py
@@ -6,13 +6,14 @@ import os
 
																 class ExcelUtil:
															
 
																     # 当前项目路径
															
 
																-    dir_path = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) + r'\resources'
															
 
																+    dir_path = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) + r'/elab_mvp/resources'
															
 
																     """
															
 
																         解析excel文件
															
 
																     """
															
 
																-    def __init__(self, sheet_name=None, path=None):
															
 
																-        if path:
															
 
																-            self.path = path
															
 
																+
															
 
																+    def __init__(self, sheet_name=None, file_name=None):
															
 
																+        if file_name:
															
 
																+            self.path = os.path.join(self.dir_path, file_name)
															
 
																         else:
															
 
																             self.path = os.path.join(self.dir_path, 'mvp.xlsx')
															
 
																         if sheet_name:
															
@@ -73,31 +74,72 @@ class ExcelUtil:
 
																         """
															
 
																         rows = [row for row in self.read_excel_by_ox().rows][24:]
															
 
																         tag_name = None
															
 
																+        tag_type = None
															
 
																         datas = []
															
 
																         for row in rows:
															
 
																+            tag_type_1 = row[0].value
															
 
																             tag = row[1].value
															
 
																             values = row[3].value
															
 
																             corr = row[4].value
															
 
																+            if tag_type_1:
															
 
																+                tag_type = tag_type_1
															
 
																             if tag:
															
 
																                 tag_name = tag
															
 
																             if values is not None:
															
 
																-                datas.append([tag_name, values, corr])
															
 
																+                datas.append([tag_type, tag_name, values, corr])
															
 
																         result = {}
															
 
																-        for name, items in groupby(datas, key=lambda obj: obj[0]):
															
 
																-            orders = []
															
 
																-            for n in items:
															
 
																-                orders.append([n[1], n[2]])
															
 
																-            result[name] = orders
															
 
																+        datas.sort(key=lambda obj: obj[0])
															
 
																+        for tag_type, sub_datas in groupby(datas, key=lambda obj: obj[0]):
															
 
																+            sub_list = [x for x in sub_datas]
															
 
																+            sub_list.sort(key=lambda obj: obj[1])
															
 
																+            sub_result = {}
															
 
																+            for name, items in groupby(sub_list, key=lambda obj: obj[1]):
															
 
																+                orders = []
															
 
																+                for n in items:
															
 
																+                    orders.append([n[2], n[3]])
															
 
																+                sub_result[name] = orders
															
 
																+            result[tag_type] = sub_result
															
 
																         return result
															
 
																+    def init_scores(self):
															
 
																+        work_sheet = self.read_excel_by_ox()
															
 
																+        rows = [row for row in work_sheet.rows]
															
 
																+        datas = []
															
 
																+        for row in rows[1:]:
															
 
																+            if row[0].value is not None:
															
 
																+                datas.append([row[0].value, row[1].value, row[2].value, row[3].value, row[4].value])
															
 
																+        return datas
															
 
																-if __name__ == '__main__':
															
 
																-    # eu = ExcelUtil()
															
 
																-    # results = eu.init_mvp_data()
															
 
																-    # for key in results.keys():
															
 
																-    #     print(key)
															
 
																-    #     print('     {}'.format(results[key]))
															
 
																-    #     print('-'*40)
															
 
																-    import os
															
 
																-    dir_path = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
															
 
																-    print(dir_path)
															
 
																+    def init_module_info(self):
															
 
																+        work_sheet = self.read_excel_by_ox()
															
 
																+        max_column = work_sheet.max_column
															
 
																+        rows = [row for row in work_sheet.rows][3:]
															
 
																+        crowd_name = None
															
 
																+        datas = []
															
 
																+        for row in rows:
															
 
																+            crowd = row[1].value
															
 
																+            if crowd is not None:
															
 
																+                crowd_name = crowd
															
 
																+            behavior = row[2].value
															
 
																+            score = row[4].value
															
 
																+            for index in range(6, max_column - 1, 2):
															
 
																+                module_name = row[index].value
															
 
																+                if module_name is not None:
															
 
																+                    weight = row[index + 1].value
															
 
																+                    datas.append([crowd_name, behavior, score, module_name, weight])
															
 
																+        results = {}
															
 
																+        datas.sort(key=lambda obj: obj[0])
															
 
																+        for name, items in groupby(datas, key=lambda obj: obj[0]):
															
 
																+            sub_results = {}
															
 
																+            sub_list = []
															
 
																+            for it in items:
															
 
																+                sub_list.append([x for x in it])
															
 
																+            sub_list.sort(key=lambda obj: obj[3])
															
 
																+            for name_1, itmes_1 in groupby(sub_list, key=lambda obj: obj[3]):
															
 
																+                sub_data = []
															
 
																+                for n in itmes_1:
															
 
																+                    # print('         {}'.format(n[1]))
															
 
																+                    sub_data.append([n[1], n[2], n[4]])
															
 
																+                sub_results[name_1] = sub_data
															
 
																+            results[name] = sub_results
															
 
																+        return results
															
--- a/flask_app.py
+++ b/flask_app.py
@@ -1,599 +1,10 @@
 
																-from flask import Flask, request, render_template, jsonify
															
 
																-import os
															
 
																-from werkzeug.utils import secure_filename
															
 
																-import time
															
 
																+from flask import Flask, request
															
 
																+from mvp import Mvp
															
 
																 import json
															
 
																-import pandas as pd
															
 
																-import openpyxl as ox
															
 
																-from itertools import groupby
															
 
																-import os
															
 
																-import pymysql as ps
															
 
																 app = Flask(__name__)
															
 
																-class Mvp:
															
 
																-    """
															
 
																-     ce mvp 答题数据统计
															
 
																-     城市特例 北京市，上海市， 重庆市，天津市
															
 
																-    """
															
 
																-
															
 
																-    age_dict = {
															
 
																-        '00-04年生': '00后',
															
 
																-        '05-09年生': '05后',
															
 
																-        '50-59年生': '50后',
															
 
																-        '60-69年生': '60后',
															
 
																-        '70-74年生': '70后',
															
 
																-        '75-79年生': '75后',
															
 
																-        '80-84年生': '80后',
															
 
																-        '85-89年生': '85后',
															
 
																-        '90-94年生': '90后',
															
 
																-        '95-99年生': '95后'
															
 
																-    }
															
 
																-
															
 
																-    crowd = ['A', 'B', 'C', 'D', 'E', 'F']
															
 
																-
															
 
																-    # 获取答题记录中城市列表
															
 
																-    sql_1 = 'select city from f_t_daren_score_2 group by city'
															
 
																-
															
 
																-    # 获取父选项和父题id
															
 
																-    sql_2 = 'select a.id, a.content, b.id, b.name from bq_option a left join bq_question b on a.question_id = b.id ' \
															
 
																-            'where a.serial_number = %s and b.serial_number = %s and a.status = b.status = 1 '
															
 
																-
															
 
																-    # 获取答题人的年龄段集合
															
 
																-    sql_4 = 'select nld from f_t_daren_score_2 group by nld'
															
 
																-
															
 
																-    # 根据城市，年龄段，人群分类统计答题记录数
															
 
																-    sql_5 = 'select group_type, COUNT(uuid) from f_t_daren_score_2 where (city = %s or province = %s) and nld ' \
															
 
																-            '= %s and uuid in %s group by group_type '
															
 
																-
															
 
																-    # 根据父选项获取子选项id列表
															
 
																-    sql_6 = 'SELECT c.id, c.sub_question_id, c.content FROM bq_sub_option c WHERE c.father_id in (SELECT a.id FROM ' \
															
 
																-            'bq_option a ' \
															
 
																-            'LEFT JOIN bq_question b ON a.question_id = b.id WHERE a.serial_number = %s AND b.serial_number = %s ' \
															
 
																-            'and a.status = 1 and b.status = 1) and c.status = 1 '
															
 
																-
															
 
																-    # 根据子题id获取包含子题id的测试
															
 
																-    sql_7 = 'select group_type from bq_testcase where status = 1 and FIND_IN_SET(%s, question_ids)'
															
 
																-
															
 
																-    # 根据子选项id统计答题数
															
 
																-    sql_8 = 'SELECT count(1) FROM f_t_daren_score_2 a LEFT JOIN d_shangju_tiku_02 b ON a.sub_question_id = ' \
															
 
																-            'b.sub_question_id AND a.score  = b.score and a.testcase_id = b.testcase_id WHERE b.sub_option_id in %s' \
															
 
																-            'and (a.city = %s or a.province = %s) and a.nld = %s and a.uuid in %s'
															
 
																-
															
 
																-    # 获取一个uuid下答题的子选项id列表
															
 
																-    sql_10 = 'select  DISTINCT uuid, GROUP_CONCAT(DISTINCT b.sub_option_id)  from f_t_daren_score_2 a left join ' \
															
 
																-             'd_shangju_tiku_02 b on a.sub_question_id = b.sub_question_id and a.score = b.score where a.status = ' \
															
 
																-             'b.status = 1 group by uuid '
															
 
																-
															
 
																-    # 向表mvp_crowd_info插入数据
															
 
																-    sql_11 = 'insert into mvp_crowd_info(age_area, city_name, crowd_type, status) values(%s, %s, %s, 1)'
															
 
																-
															
 
																-    # 向表mvp_crowd_info_behavior中插入数据
															
 
																-    sql_12 = 'insert into mvp_crowd_info_behavior(crowd_info_id, behavioral_interest, standard_value, status) values(' \
															
 
																-             '%s, %s, ' \
															
 
																-             '%s, 1) '
															
 
																-
															
 
																-    # 向表mvp_crowd_info_module中插入数据
															
 
																-    sql_13 = 'insert into mvp_crowd_info_module(crowd_info_id, module_name, standard_value, status) values (%s, %s, ' \
															
 
																-             '%s, 1) '
															
 
																-
															
 
																-    sql_14 = 'select a.id, a.age_area, a.city_name, a.crowd_type from mvp_crowd_info a where a.status = 1'
															
 
																-
															
 
																-    def __init__(self, path=None):
															
 
																-        self.shangju_db = MysqlDB('shangju')
															
 
																-        self.marketing_db = MysqlDB('bi_report')
															
 
																-        # self.shangju_db.truncate('mvp_standard_score')
															
 
																-        self.tag_data = ExcelUtil(file_name=path).init_mvp_data()
															
 
																-        self.crowd_info = ExcelUtil(file_name=path, sheet_name='选项-人群分类对应表').init_crowd_info()
															
 
																-        self.citys = self.init_city()
															
 
																-        self.age = self.init_age()
															
 
																-        self.people_sub_option_ids = self.marketing_db.select(self.sql_10)
															
 
																-        self.crowd_contain_sub_option_ids = self.get_crowd_contain_sub_option_ids()
															
 
																-        self.module_scores = ExcelUtil(file_name='set-behavior-tag.xlsx', sheet_name='算法关系表').init_module_info()
															
 
																-        # self.scores_tag = ExcelUtil(file_name='行为与模块分值汇总.xlsx', sheet_name='行为').init_scores()
															
 
																-        # self.score_module = ExcelUtil(file_name='行为与模块分值汇总.xlsx', sheet_name='模块').init_scores()
															
 
																-        self.scores_tag = None
															
 
																-        self.score_module = None
															
 
																-
															
 
																-
															
 
																-    def init_city(self):
															
 
																-        """
															
 
																-            获取答题数据中的城市。
															
 
																-        :return:
															
 
																-        """
															
 
																-        citys = ['北京市', '上海市', '重庆市', '天津市']
															
 
																-        citys_info = self.marketing_db.select(self.sql_1)
															
 
																-        citys.extend([x[0] for x in citys_info if x[0] is not None])
															
 
																-        return citys
															
 
																-
															
 
																-    def query_behavioral_info(self, city=None, age=None, crowd=None):
															
 
																-        """
															
 
																-            查询行为兴趣信息
															
 
																-        :return:
															
 
																-        """
															
 
																-        # datas = []
															
 
																-        # for key in self.tag_data.keys():
															
 
																-        #     values = self.tag_data[key]
															
 
																-        #     for value in values:
															
 
																-        #         question = value[0].split('-')[0]
															
 
																-        #         option = value[0].split('-')[1]
															
 
																-        #         corr = value[1]
															
 
																-        #         data = self.shangju_db.select(self.sql_2, [option, question])
															
 
																-        #         if len(data) > 0:
															
 
																-        #             print([question, option, data[0][3], data[0][1], key, corr])
															
 
																-        #             datas.append([question, option, data[0][3], data[0][1], key, corr])
															
 
																-        # self.shangju_db.truncate('mvp_question_classification')
															
 
																-        # self.shangju_db.add_some(self.sql_3, datas)
															
 
																-        scores_behavioral = self.city_age_crowd(city, age, crowd)
															
 
																-        # scores_module = self.module_score(crowd, city, age, scores_behavioral['score'])
															
 
																-        # result = {'行为兴趣分值': scores_behavioral['score'], '模块分值': scores_module}
															
 
																-        print('update finished!!!')
															
 
																-        return scores_behavioral
															
 
																-
															
 
																-    def module_score(self, crowd, city, age, scores):
															
 
																-        """
															
 
																-            模块分数计算
															
 
																-            城市 年龄 人群分类 模块名称 分数
															
 
																-        :return:
															
 
																-        """
															
 
																-        modules = self.module_scores[crowd]
															
 
																-        result = []
															
 
																-        for key in modules.keys():
															
 
																-            values = modules[key]
															
 
																-            module_name = key
															
 
																-            score = 0
															
 
																-            for value in values:
															
 
																-                behavioral_name = value[0]
															
 
																-                weight = float(value[2])
															
 
																-                standard_score = [x[4] for x in scores if x[2] == behavioral_name]
															
 
																-                if len(standard_score) > 0:
															
 
																-                    score += standard_score[0] * weight
															
 
																-            result.append([city, age, crowd, module_name, score])
															
 
																-        return result
															
 
																-
															
 
																-    # def insert_data(self, scores_behavioral, scores_module):
															
 
																-    def insert(self):
															
 
																-        """
															
 
																-            计算数据写入数据库中，供接口查看
															
 
																-        :return:
															
 
																-        """
															
 
																-        infos = []
															
 
																-        for city in ['上海市', '宁波市', '苏州市', '杭州市', ' 无锡市']:
															
 
																-            for age in ['50-59年生', '60-69年生', '70-74年生', '75-79年生', '80-84年生', '85-89年生', '90-94年生', '95-99年生', '00'
															
 
																-                                                                                                                '-04年生', '05-09年生']:
															
 
																-                for c_type in ['A', 'B', 'C', 'D', 'E', 'F']:
															
 
																-                    age_area = self.age_dict.get(age)
															
 
																-                    if age_area:
															
 
																-                        infos.append([age_area, city, c_type])
															
 
																-        self.shangju_db.add_some(self.sql_11, infos)
															
 
																-
															
 
																-    def query_data(self):
															
 
																-        ids = self.shangju_db.select(self.sql_14)
															
 
																-        return ids
															
 
																-
															
 
																-    def shanghai_85_module_score_insert(self):
															
 
																-        """
															
 
																-            上海市，85后模块分数计算
															
 
																-        :return:
															
 
																-        """
															
 
																-        result = []
															
 
																-        for crowd in self.crowd:
															
 
																-            modules = self.module_scores[crowd]
															
 
																-            for key in modules.keys():
															
 
																-                values = modules[key]
															
 
																-                module_name = key
															
 
																-                score = 0
															
 
																-                for value in values:
															
 
																-                    behavioral_name = value[0]
															
 
																-                    weight = float(value[2])
															
 
																-                    # standard_score = [x[4] for x in scores if x[2] == behavioral_name]
															
 
																-                    standard_score = float(value[1])
															
 
																-                    if standard_score is not None:
															
 
																-                        score += standard_score * weight
															
 
																-                result.append(['上海市', '85后', crowd, module_name, score])
															
 
																-        return {'score': result, 'data': self.module_scores}
															
 
																-
															
 
																-    def tag_module_score_insert(self):
															
 
																-        """
															
 
																-            标签模块分数写入数据库
															
 
																-        :return:
															
 
																-        """
															
 
																-        ids = self.query_data()
															
 
																-        insert_data = []
															
 
																-        insert_data_1 = []
															
 
																-        for tag, module in zip(self.scores_tag, self.score_module):
															
 
																-            city = tag[0]
															
 
																-            age = tag[1]
															
 
																-            crowd = tag[2]
															
 
																-            tag_name = tag[3]
															
 
																-            tag_score = tag[4]
															
 
																-
															
 
																-            city_2 = module[0]
															
 
																-            age_2 = module[1]
															
 
																-            crowd_2 = module[2]
															
 
																-            module_name_2 = module[3]
															
 
																-            module_score_2 = module[4]
															
 
																-
															
 
																-            for id in ids:
															
 
																-                city_1 = id[2]
															
 
																-                age_1 = id[1]
															
 
																-                crowd_1 = id[3]
															
 
																-                id_1 = id[0]
															
 
																-                if city == city_1 and self.age_dict[age] == age_1 and crowd == crowd_1:
															
 
																-                    insert_data.append([id_1, tag_name, tag_score])
															
 
																-                if city_2 == city_1 and self.age_dict[age_2] == age_1 and crowd_2 == crowd_1:
															
 
																-                    insert_data_1.append([id_1, module_name_2, module_score_2])
															
 
																-        self.shangju_db.add_some(self.sql_12, insert_data)
															
 
																-        self.shangju_db.add_some(self.sql_13, insert_data_1)
															
 
																-
															
 
																-    def init_age(self):
															
 
																-        """
															
 
																-           获取答题数据中的年龄
															
 
																-        """
															
 
																-        age_info = self.marketing_db.select(self.sql_4)
															
 
																-        # print([x[0] for x in age_info])
															
 
																-        return [x[0] for x in age_info if x[0] is not None]
															
 
																-
															
 
																-    def city_age_crowd(self, city=None, age=None, crowd=None):
															
 
																-        data_start = []
															
 
																-        result = []
															
 
																-        module_scores = []
															
 
																-        if city is not None and age is not None and crowd is not None:
															
 
																-            print('获取指定城市，年龄段，人群类型的数据...')
															
 
																-            people_uuids = self.get_people_uuid_by_type(crowd)
															
 
																-            if len(people_uuids) > 0:
															
 
																-                print('{}-{}-{}'.format(city, age, crowd))
															
 
																-                datas = self.behavior_tag_init(city, age, people_uuids)
															
 
																-                data_start.append(datas)
															
 
																-                result.extend(self.calculation_standard_score(datas, city, age, crowd))
															
 
																-            module_scores.extend(self.module_score(crowd, city, age, result))
															
 
																-            pass
															
 
																-        else:
															
 
																-            print('获取所有case的数据...')
															
 
																-            # for city in self.citys:
															
 
																-            # for city in [city]:
															
 
																-            for age in self.age:
															
 
																-                for crowd_type in self.crowd:
															
 
																-                    if age == '85-89年生' and city == '上海市':
															
 
																-                        print('上海市85后数据导入人工值，无需计算...')
															
 
																-                        pass
															
 
																-                    else:
															
 
																-                        # print(' {}{}'.format(city, age))
															
 
																-                        people_uuids = self.get_people_uuid_by_type(crowd_type)
															
 
																-                        if len(people_uuids) > 0:
															
 
																-                            print('{}-{}-{}'.format(city, age, crowd_type))
															
 
																-                            datas = self.behavior_tag_init(city, age, people_uuids)
															
 
																-                            data_start.append(datas)
															
 
																-                            result.extend(self.calculation_standard_score(datas, city, age, crowd_type))
															
 
																-                        module_scores.extend(self.module_score(crowd_type, city, age, result))
															
 
																-        # return result
															
 
																-        # data_list = []
															
 
																-        # for e in data_start:
															
 
																-        #     for key in e.keys():
															
 
																-        #         values = e[key]
															
 
																-        #         for sub_e in values:
															
 
																-        #             ele = [key]
															
 
																-        #             ele.extend(sub_e)
															
 
																-        #             data_list.append(ele)
															
 
																-        #     pass
															
 
																-        return {'tag_score': result, 'module_score': module_scores}
															
 
																-        # return {'score': result, 'data': data_list}
															
 
																-
															
 
																-    def behavior_tag_init(self, city, age, people_uuids):
															
 
																-        result = {}
															
 
																-        self.group_type_count = self.marketing_db.select(self.sql_5, [city, city, age, people_uuids])
															
 
																-        for key in self.tag_data:
															
 
																-            values = self.tag_data[key]
															
 
																-            elements = []
															
 
																-            for value in values:
															
 
																-                question = value[0].split('-')[0]
															
 
																-                option = value[0].split('-')[1]
															
 
																-                corr = value[1]
															
 
																-                fz, fm = self.molecular_value(question, option, city, age, people_uuids)
															
 
																-                if fm == 0:
															
 
																-                    c = 0
															
 
																-                else:
															
 
																-                    c = fz / fm
															
 
																-                elements.append([question, option, corr, fz, fm, c])
															
 
																-            result[key] = elements
															
 
																-        return self.indicator_calculation_d_e(result)
															
 
																-
															
 
																-    def molecular_value(self, queston, option, city, age, people_uuids):
															
 
																-        # 获取当前父选项包含的子选项id和子题id列表
															
 
																-        result = self.shangju_db.select(self.sql_6, [option, queston])
															
 
																-        sub_option_ids = []
															
 
																-        group_types = []
															
 
																-        for rt in result:
															
 
																-            sub_option_id, sub_question_id, content = rt[0], rt[1], rt[2]
															
 
																-            grouptypes = self.shangju_db.select(self.sql_7, [sub_question_id])
															
 
																-            for g_t in grouptypes:
															
 
																-                if g_t[0] not in group_types:
															
 
																-                    group_types.append(g_t[0])
															
 
																-            sub_option_ids.append(sub_option_id)
															
 
																-        # 计算子选项在答题记录中的点击数
															
 
																-        sub_options_count = 0
															
 
																-        if len(sub_option_ids) > 0:
															
 
																-            result_1 = self.marketing_db.select(self.sql_8, [sub_option_ids, city, city, age, people_uuids])
															
 
																-            sub_options_count = result_1[0][0]
															
 
																-        # 计算父选项包含的子选项对应的子题所在的测试gt包含的点击数。
															
 
																-        denominator_value = 0
															
 
																-        for info in self.group_type_count:
															
 
																-            if info[0] in group_types:
															
 
																-                denominator_value += info[1]
															
 
																-        return sub_options_count, denominator_value
															
 
																-
															
 
																-    def indicator_calculation_d_e(self, data):
															
 
																-        result = {}
															
 
																-        for key in data.keys():
															
 
																-            values = data[key]
															
 
																-            c_list = []
															
 
																-            for x in values:
															
 
																-                _x = x[5]
															
 
																-                if _x is not None and x != 0:
															
 
																-                    c_list.append(_x)
															
 
																-            fm_list = [x[4] for x in values]
															
 
																-            sum_c = sum(fm_list)
															
 
																-            if len(c_list) == 0:
															
 
																-                min_c = 0
															
 
																-            else:
															
 
																-                min_c = min(c_list)
															
 
																-            elements = []
															
 
																-            for value in values:
															
 
																-                _value = []
															
 
																-                c = value[5]
															
 
																-                if sum_c == 0:
															
 
																-                    d = 0
															
 
																-                else:
															
 
																-                    d = c / sum_c
															
 
																-                e = c - min_c
															
 
																-                _value.extend(value)
															
 
																-                _value.append(d)
															
 
																-                _value.append(e)
															
 
																-                elements.append(_value)
															
 
																-            result[key] = elements
															
 
																-        return result
															
 
																-
															
 
																-    def calculation_standard_score(self, datas, city, age, crowd_type):
															
 
																-        scores = []
															
 
																-        for key in datas.keys():
															
 
																-            print(key)
															
 
																-            print('     父题序号 父选项序号 相关系系数 分子值 分母值 百分比 人数权重 偏离值')
															
 
																-            values = [x[5] for x in datas[key]]
															
 
																-            min_c = min(values)
															
 
																-            f = min_c
															
 
																-            for value in datas[key]:
															
 
																-                print('     {}'.format(value))
															
 
																-                if value[2] is not None and value[7] is not None:
															
 
																-                    f += float(value[2] * value[7])
															
 
																-            print('     标准分：{}'.format(f))
															
 
																-            scores.append([city, age, key, crowd_type, f])
															
 
																-        # self.shangju_db.add_some(self.sql_9, scores)
															
 
																-        return scores
															
 
																-
															
 
																-    def get_crowd_people(self):
															
 
																-        result = {}
															
 
																-        for type in self.crowd:
															
 
																-            uuids = self.get_people_uuid_by_type(type)
															
 
																-            result[type] = len(uuids)
															
 
																-        return result
															
 
																-
															
 
																-    def get_people_uuid_by_type(self, type):
															
 
																-        uuids = []
															
 
																-        type_sub_option_ids = self.crowd_contain_sub_option_ids[type]
															
 
																-        for people in self.people_sub_option_ids:
															
 
																-            uuid = people[0]
															
 
																-            sub_option_ids = list(map(int, str(people[1]).split(',')))
															
 
																-            # list(set(a).intersection(set(b)))
															
 
																-            if len(list(set(sub_option_ids).intersection(set(type_sub_option_ids)))) > 0 and uuid not in uuids:
															
 
																-                uuids.append(uuid)
															
 
																-        return uuids
															
 
																-
															
 
																-    def get_crowd_contain_sub_option_ids(self):
															
 
																-        """
															
 
																-            获取ABCDEF人群包含的子选项id
															
 
																-        :return:
															
 
																-        """
															
 
																-        infos = {}
															
 
																-        for key in self.crowd_info.keys():
															
 
																-            values = self.crowd_info[key]
															
 
																-            sub_option_ids = []
															
 
																-            for value in values:
															
 
																-                if value is not None:
															
 
																-                    vals = str(value).split('-')
															
 
																-                    option, question = vals[1], vals[0]
															
 
																-                    query_result = self.shangju_db.select(self.sql_6, [option, question])
															
 
																-                    for qr in query_result:
															
 
																-                        sub_option_id, sub_question_id, content = qr[0], qr[1], qr[2]
															
 
																-                        sub_option_ids.append(int(sub_option_id))
															
 
																-            infos[key] = sub_option_ids
															
 
																-        print(infos)
															
 
																-        return infos
															
 
																-
															
 
																-
															
 
																-class ExcelUtil:
															
 
																-    # 当前项目路径
															
 
																-    dir_path = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) + r'/elab_mvp/resources'
															
 
																-    """
															
 
																-        解析excel文件
															
 
																-    """
															
 
																-
															
 
																-    def __init__(self, sheet_name=None, file_name=None):
															
 
																-        if file_name:
															
 
																-            self.path = os.path.join(self.dir_path, file_name)
															
 
																-        else:
															
 
																-            self.path = os.path.join(self.dir_path, 'mvp.xlsx')
															
 
																-        if sheet_name:
															
 
																-            self.sheet_name = sheet_name
															
 
																-        else:
															
 
																-            self.sheet_name = '硬标签+行为'
															
 
																-
															
 
																-    def read_excel_by_pd(self):
															
 
																-        df = pd.read_excel(self.path)
															
 
																-        data = df.head()
															
 
																-        print('获取到的数据{}'.format(data))
															
 
																-
															
 
																-    def read_excel_by_ox(self):
															
 
																-        work_book = ox.load_workbook(self.path, data_only=True)
															
 
																-        work_sheet = work_book.get_sheet_by_name(self.sheet_name)
															
 
																-        # print('max_row:{}, max_col:{}'.format(work_sheet.max_row, work_sheet.max_column))
															
 
																-        return work_sheet
															
 
																-
															
 
																-    def init_crowd_info(self):
															
 
																-        """
															
 
																-            整理不同人群包含的父选序号
															
 
																-        :return:
															
 
																-        """
															
 
																-        rows = [row for row in self.read_excel_by_ox().rows]
															
 
																-        crowd_a = []
															
 
																-        crowd_b = []
															
 
																-        crowd_c = []
															
 
																-        crowd_d = []
															
 
																-        crowd_e = []
															
 
																-        crowd_f = []
															
 
																-
															
 
																-        for row in rows[2:]:
															
 
																-            option = row[4].value
															
 
																-            a = row[6].value
															
 
																-            if a is not None and a == 1 and option not in crowd_a:
															
 
																-                crowd_a.append(option)
															
 
																-            b = row[7].value
															
 
																-            if b is not None and b == 1 and option not in crowd_b:
															
 
																-                crowd_b.append(option)
															
 
																-            c = row[8].value
															
 
																-            if c is not None and c == 1 and option not in crowd_d:
															
 
																-                crowd_c.append(option)
															
 
																-            d = row[9].value
															
 
																-            if d is not None and d == 1 and option not in crowd_d:
															
 
																-                crowd_d.append(option)
															
 
																-            e = row[10].value
															
 
																-            if e is not None and e == 1 and option not in crowd_e:
															
 
																-                crowd_e.append(option)
															
 
																-            f = row[11].value
															
 
																-            if f is not None and f == 1 and option not in crowd_f:
															
 
																-                crowd_f.append(option)
															
 
																-        return {'A': crowd_a, 'B': crowd_b, 'C': crowd_c, 'D': crowd_d, 'E': crowd_e, 'F': crowd_f}
															
 
																-
															
 
																-    def init_mvp_data(self):
															
 
																-        """
															
 
																-            获取每个标签包括的父题父选项编号
															
 
																-        :return:
															
 
																-        """
															
 
																-        rows = [row for row in self.read_excel_by_ox().rows][24:]
															
 
																-        tag_name = None
															
 
																-        datas = []
															
 
																-        for row in rows:
															
 
																-            tag = row[1].value
															
 
																-            values = row[3].value
															
 
																-            corr = row[4].value
															
 
																-            if tag:
															
 
																-                tag_name = tag
															
 
																-            if values is not None:
															
 
																-                datas.append([tag_name, values, corr])
															
 
																-        result = {}
															
 
																-        for name, items in groupby(datas, key=lambda obj: obj[0]):
															
 
																-            orders = []
															
 
																-            for n in items:
															
 
																-                orders.append([n[1], n[2]])
															
 
																-            result[name] = orders
															
 
																-        return result
															
 
																-
															
 
																-    def init_scores(self):
															
 
																-        work_sheet = self.read_excel_by_ox()
															
 
																-        rows = [row for row in work_sheet.rows]
															
 
																-        datas = []
															
 
																-        for row in rows[1:]:
															
 
																-            if row[0].value is not None:
															
 
																-                datas.append([row[0].value, row[1].value, row[2].value, row[3].value, row[4].value])
															
 
																-        return datas
															
 
																-
															
 
																-    def init_module_info(self):
															
 
																-        work_sheet = self.read_excel_by_ox()
															
 
																-        max_column = work_sheet.max_column
															
 
																-        rows = [row for row in work_sheet.rows][3:]
															
 
																-        crowd_name = None
															
 
																-        datas = []
															
 
																-        for row in rows:
															
 
																-            crowd = row[1].value
															
 
																-            if crowd is not None:
															
 
																-                crowd_name = crowd
															
 
																-            behavior = row[2].value
															
 
																-            score = row[4].value
															
 
																-            for index in range(6, max_column - 1, 2):
															
 
																-                module_name = row[index].value
															
 
																-                if module_name is not None:
															
 
																-                    weight = row[index + 1].value
															
 
																-                    datas.append([crowd_name, behavior, score, module_name, weight])
															
 
																-        results = {}
															
 
																-        datas.sort(key=lambda obj: obj[0])
															
 
																-        for name, items in groupby(datas, key=lambda obj: obj[0]):
															
 
																-            sub_results = {}
															
 
																-            sub_list = []
															
 
																-            for it in items:
															
 
																-                sub_list.append([x for x in it])
															
 
																-            sub_list.sort(key=lambda obj: obj[3])
															
 
																-            for name_1, itmes_1 in groupby(sub_list, key=lambda obj: obj[3]):
															
 
																-                sub_data = []
															
 
																-                for n in itmes_1:
															
 
																-                    # print('         {}'.format(n[1]))
															
 
																-                    sub_data.append([n[1], n[2], n[4]])
															
 
																-                sub_results[name_1] = sub_data
															
 
																-            results[name] = sub_results
															
 
																-        return results
															
 
																-
															
 
																-
															
 
																-class MysqlDB:
															
 
																-    """
															
 
																-        mysql操作
															
 
																-    """
															
 
																-    con = None
															
 
																-    cursor = None
															
 
																-
															
 
																-    def __init__(self, db_name):
															
 
																-        self.db_name = db_name
															
 
																-        self.con = ps.connect(host='172.19.189.136', port=3306, user='bi_etl', password='XPtpswuU5lwGo4kx',
															
 
																-                              db=self.db_name, charset='utf8')
															
 
																-        # self.con = ps.connect(host='192.168.0.13', port=3306, user='root', password='elab@123'
															
 
																-        #                       , db=self.db_name, charset='utf8')
															
 
																-        self.cursor = self.con.cursor()
															
 
																-
															
 
																-    def show_tables(self):
															
 
																-        self.cursor.execute('show tables')
															
 
																-        for talbe in self.cursor.fetchall():
															
 
																-            print(talbe)
															
 
																-
															
 
																-    def select(self, sql, params=None):
															
 
																-        if params:
															
 
																-            self.cursor.execute(sql, params)
															
 
																-        else:
															
 
																-            self.cursor.execute(sql)
															
 
																-        return self.cursor.fetchall()
															
 
																-
															
 
																-    def add_some(self, sql, data):
															
 
																-        try:
															
 
																-            self.cursor.executemany(sql, data)
															
 
																-            self.con.commit()
															
 
																-        except:
															
 
																-            print('数据插入异常...')
															
 
																-            self.con.rollback()
															
 
																-
															
 
																-    def add_one(self, sql, data):
															
 
																-        try:
															
 
																-            self.cursor.execute(sql, data)
															
 
																-            self.con.commit()
															
 
																-        except:
															
 
																-            self.con.rollback()
															
 
																-
															
 
																-    def truncate(self, table_name):
															
 
																-        sql = 'truncate table {}'.format(table_name)
															
 
																-        self.cursor.execute(sql)
															
 
																-        self.con.commit()
															
 
																-
															
 
																-    def close(self):
															
 
																-        self.cursor.close()
															
 
																-        self.con.close()
															
 
																-
															
 
																-
															
 
																 @app.route('/behavioral_statistics', methods=['GET', 'POST'])
															
 
																 def behavioral_statistics():
															
 
																     """
															
@@ -606,8 +17,7 @@ def behavioral_statistics():
 
																     print(city, age, crowd)
															
 
																     mvp = Mvp()
															
 
																     scores = mvp.query_behavioral_info(city, age, crowd)
															
 
																-    mvp.shangju_db.close()
															
 
																-    mvp.marketing_db.close()
															
 
																+    mvp.close()
															
 
																     return json.dumps(scores, ensure_ascii=False)
															
@@ -619,8 +29,7 @@ def get_city_age_crowd():
 
																     """
															
 
																     mvp = Mvp()
															
 
																     infos = {'城市': mvp.citys, '年龄段': mvp.age, '人群分类': mvp.crowd}
															
 
																-    mvp.shangju_db.close()
															
 
																-    mvp.marketing_db.close()
															
 
																+    mvp.close()
															
 
																     return json.dumps(infos, ensure_ascii=False)
															
@@ -632,8 +41,7 @@ def crowd_people():
 
																     """
															
 
																     mvp = Mvp()
															
 
																     people_count = mvp.get_crowd_people()
															
 
																-    mvp.shangju_db.close()
															
 
																-    mvp.marketing_db.close()
															
 
																+    mvp.close()
															
 
																     return json.dumps(people_count, ensure_ascii=False)
															
@@ -644,6 +52,7 @@ def set_behavior_tag():
 
																     :return:
															
 
																     """
															
 
																     mvp = Mvp()
															
 
																+    mvp.close()
															
 
																     return json.dumps(mvp.module_scores, ensure_ascii=False)
															
@@ -652,6 +61,7 @@ def insert_info():
 
																     mvp = Mvp()
															
 
																     mvp.insert()
															
 
																     query_data = mvp.query_data()
															
 
																+    mvp.close()
															
 
																     return json.dumps(query_data, ensure_ascii=False)
															
@@ -659,6 +69,7 @@ def insert_info():
 
																 def insert_score():
															
 
																     mvp = Mvp()
															
 
																     mvp.tag_module_score_insert()
															
 
																+    mvp.close()
															
 
																     return '!!!分数添加成功!!!'
															
@@ -666,9 +77,17 @@ def insert_score():
 
																 def shanghai_85():
															
 
																     mvp = Mvp()
															
 
																     data = mvp.shanghai_85_module_score_insert()
															
 
																+    mvp.close()
															
 
																     return json.dumps(data, ensure_ascii=False)
															
 
																+@app.route('/tag_tree', methods=['GET', 'POST'])
															
 
																+def tag_tree():
															
 
																+    mvp = Mvp()
															
 
																+    tags = mvp.tag_data
															
 
																+    return json.dumps(tags, ensure_ascii=False)
															
 
																+
															
 
																+
															
 
																 if __name__ == '__main__':
															
 
																     app.run(
															
 
																         host='0.0.0.0',
															
--- a/mvp.py
+++ b/mvp.py
@@ -0,0 +1,419 @@
 
																+from mysql_db import MysqlDB
															
 
																+from excel_util import ExcelUtil
															
 
																+
															
 
																+
															
 
																+class Mvp:
															
 
																+    """
															
 
																+     ce mvp 答题数据统计
															
 
																+     城市特例 北京市，上海市， 重庆市，天津市
															
 
																+    """
															
 
																+
															
 
																+    age_dict = {
															
 
																+        '00-04年生': '00后',
															
 
																+        '05-09年生': '05后',
															
 
																+        '50-59年生': '50后',
															
 
																+        '60-69年生': '60后',
															
 
																+        '70-74年生': '70后',
															
 
																+        '75-79年生': '75后',
															
 
																+        '80-84年生': '80后',
															
 
																+        '85-89年生': '85后',
															
 
																+        '90-94年生': '90后',
															
 
																+        '95-99年生': '95后'
															
 
																+    }
															
 
																+
															
 
																+    crowd = ['A', 'B', 'C', 'D', 'E', 'F']
															
 
																+
															
 
																+    # 获取答题记录中城市列表
															
 
																+    sql_1 = 'select city from f_t_daren_score_2 group by city'
															
 
																+
															
 
																+    # 获取父选项和父题id
															
 
																+    sql_2 = 'select a.id, a.content, b.id, b.name from bq_option a left join bq_question b on a.question_id = b.id ' \
															
 
																+            'where a.serial_number = %s and b.serial_number = %s and a.status = b.status = 1 '
															
 
																+
															
 
																+    # 获取答题人的年龄段集合
															
 
																+    sql_4 = 'select nld from f_t_daren_score_2 group by nld'
															
 
																+
															
 
																+    # 根据城市，年龄段，人群分类统计答题记录数
															
 
																+    sql_5 = 'select group_type, COUNT(uuid) from f_t_daren_score_2 where (city = %s or province = %s) and nld ' \
															
 
																+            '= %s and uuid in %s group by group_type '
															
 
																+
															
 
																+    # 根据父选项获取子选项id列表
															
 
																+    sql_6 = 'SELECT c.id, c.sub_question_id, c.content FROM bq_sub_option c WHERE c.father_id in (SELECT a.id FROM ' \
															
 
																+            'bq_option a ' \
															
 
																+            'LEFT JOIN bq_question b ON a.question_id = b.id WHERE a.serial_number = %s AND b.serial_number = %s ' \
															
 
																+            'and a.status = 1 and b.status = 1) and c.status = 1 '
															
 
																+
															
 
																+    # 根据子题id获取包含子题id的测试
															
 
																+    sql_7 = 'select group_type from bq_testcase where status = 1 and FIND_IN_SET(%s, question_ids)'
															
 
																+
															
 
																+    # 根据子选项id统计答题数
															
 
																+    sql_8 = 'SELECT count(1) FROM f_t_daren_score_2 a LEFT JOIN d_shangju_tiku_02 b ON a.sub_question_id = ' \
															
 
																+            'b.sub_question_id AND (a.score  = b.score or a.score = b.sub_option_id) and a.testcase_id = ' \
															
 
																+            'b.testcase_id WHERE b.sub_option_id in %s' \
															
 
																+            'and (a.city = %s or a.province = %s) and a.nld = %s and a.uuid in %s'
															
 
																+
															
 
																+    # 获取一个uuid下答题的子选项id列表
															
 
																+    sql_10 = 'select  DISTINCT uuid, GROUP_CONCAT(DISTINCT b.sub_option_id)  from f_t_daren_score_2 a left join ' \
															
 
																+             'd_shangju_tiku_02 b on a.sub_question_id = b.sub_question_id and (a.score = b.score or a.score = ' \
															
 
																+             'b.sub_option_id) where a.status = ' \
															
 
																+             'b.status = 1 group by uuid '
															
 
																+
															
 
																+    # 向表mvp_crowd_info插入数据
															
 
																+    sql_11 = 'insert into mvp_crowd_info(age_area, city_name, crowd_type, status) values(%s, %s, %s, 1)'
															
 
																+
															
 
																+    # 向表mvp_crowd_info_behavior中插入数据
															
 
																+    sql_12 = 'insert into mvp_crowd_info_behavior(crowd_info_id, behavioral_interest, standard_value, status) values(' \
															
 
																+             '%s, %s, ' \
															
 
																+             '%s, 1) '
															
 
																+
															
 
																+    # 向表mvp_crowd_info_module中插入数据
															
 
																+    sql_13 = 'insert into mvp_crowd_info_module(crowd_info_id, module_name, standard_value, status) values (%s, %s, ' \
															
 
																+             '%s, 1) '
															
 
																+
															
 
																+    sql_14 = 'select a.id, a.age_area, a.city_name, a.crowd_type from mvp_crowd_info a where a.status = 1'
															
 
																+
															
 
																+    def __init__(self, path=None):
															
 
																+        self.shangju_db = MysqlDB('shangju')
															
 
																+        self.marketing_db = MysqlDB('bi_report')
															
 
																+        # self.shangju_db.truncate('mvp_standard_score')
															
 
																+        self.tag_data = ExcelUtil(file_name=path).init_mvp_data()
															
 
																+        self.crowd_info = ExcelUtil(file_name=path, sheet_name='选项-人群分类对应表').init_crowd_info()
															
 
																+        self.citys = self.init_city()
															
 
																+        self.age = self.init_age()
															
 
																+        self.people_sub_option_ids = self.marketing_db.select(self.sql_10)
															
 
																+        self.crowd_contain_sub_option_ids = self.get_crowd_contain_sub_option_ids()
															
 
																+        self.module_scores = ExcelUtil(file_name='set-behavior-tag.xlsx', sheet_name='算法关系表').init_module_info()
															
 
																+        # self.scores_tag = ExcelUtil(file_name='行为与模块分值汇总.xlsx', sheet_name='行为').init_scores()
															
 
																+        # self.score_module = ExcelUtil(file_name='行为与模块分值汇总.xlsx', sheet_name='模块').init_scores()
															
 
																+        self.scores_tag = None
															
 
																+        self.score_module = None
															
 
																+
															
 
																+    def close(self):
															
 
																+        self.shangju_db.close()
															
 
																+        self.marketing_db.close()
															
 
																+
															
 
																+    def init_city(self):
															
 
																+        """
															
 
																+            获取答题数据中的城市。
															
 
																+        :return:
															
 
																+        """
															
 
																+        citys = ['宁波市', '上海市', '苏州市', '无锡市', '宁波市']
															
 
																+        # citys_info = self.marketing_db.select(self.sql_1)
															
 
																+        # citys.extend([x[0] for x in citys_info if x[0] is not None])
															
 
																+        return citys
															
 
																+
															
 
																+    def query_behavioral_info(self, city=None, age=None, crowd=None):
															
 
																+        """
															
 
																+            查询行为兴趣信息
															
 
																+        :return:
															
 
																+        """
															
 
																+        # datas = []
															
 
																+        # for key in self.tag_data.keys():
															
 
																+        #     values = self.tag_data[key]
															
 
																+        #     for value in values:
															
 
																+        #         question = value[0].split('-')[0]
															
 
																+        #         option = value[0].split('-')[1]
															
 
																+        #         corr = value[1]
															
 
																+        #         data = self.shangju_db.select(self.sql_2, [option, question])
															
 
																+        #         if len(data) > 0:
															
 
																+        #             print([question, option, data[0][3], data[0][1], key, corr])
															
 
																+        #             datas.append([question, option, data[0][3], data[0][1], key, corr])
															
 
																+        # self.shangju_db.truncate('mvp_question_classification')
															
 
																+        # self.shangju_db.add_some(self.sql_3, datas)
															
 
																+        scores_behavioral = self.city_age_crowd(city, age, crowd)
															
 
																+        # scores_module = self.module_score(crowd, city, age, scores_behavioral['score'])
															
 
																+        # result = {'行为兴趣分值': scores_behavioral['score'], '模块分值': scores_module}
															
 
																+        print('update finished!!!')
															
 
																+        return scores_behavioral
															
 
																+
															
 
																+    def module_score(self, crowd, city, age, scores):
															
 
																+        """
															
 
																+            模块分数计算
															
 
																+            城市 年龄 人群分类 模块名称 分数
															
 
																+        :return:
															
 
																+        """
															
 
																+        behavioral_score = scores['用户画像-行为兴趣']
															
 
																+        modules = self.module_scores[crowd]
															
 
																+        result = []
															
 
																+        for key in modules.keys():
															
 
																+            values = modules[key]
															
 
																+            module_name = key
															
 
																+            score = 0
															
 
																+            for value in values:
															
 
																+                behavioral_name = value[0]
															
 
																+                weight = float(value[2])
															
 
																+                standard_score = [x[4] for x in behavioral_score if x[2] == behavioral_name]
															
 
																+                if len(standard_score) > 0:
															
 
																+                    score += standard_score[0] * weight
															
 
																+            result.append([city, age, crowd, module_name, score])
															
 
																+        return result
															
 
																+
															
 
																+    # def insert_data(self, scores_behavioral, scores_module):
															
 
																+    def insert(self):
															
 
																+        """
															
 
																+            计算数据写入数据库中，供接口查看
															
 
																+        :return:
															
 
																+        """
															
 
																+        infos = []
															
 
																+        for city in ['上海市', '宁波市', '苏州市', '杭州市', ' 无锡市']:
															
 
																+            for age in ['50-59年生', '60-69年生', '70-74年生', '75-79年生', '80-84年生', '85-89年生', '90-94年生', '95-99年生', '00'
															
 
																+                                                                                                                '-04年生',
															
 
																+                        '05-09年生']:
															
 
																+                for c_type in ['A', 'B', 'C', 'D', 'E', 'F']:
															
 
																+                    age_area = self.age_dict.get(age)
															
 
																+                    if age_area:
															
 
																+                        infos.append([age_area, city, c_type])
															
 
																+        self.shangju_db.add_some(self.sql_11, infos)
															
 
																+
															
 
																+    def query_data(self):
															
 
																+        ids = self.shangju_db.select(self.sql_14)
															
 
																+        return ids
															
 
																+
															
 
																+    def shanghai_85_module_score_insert(self):
															
 
																+        """
															
 
																+            上海市，85后模块分数计算
															
 
																+        :return:
															
 
																+        """
															
 
																+        result = []
															
 
																+        for crowd in self.crowd:
															
 
																+            modules = self.module_scores[crowd]
															
 
																+            for key in modules.keys():
															
 
																+                values = modules[key]
															
 
																+                module_name = key
															
 
																+                score = 0
															
 
																+                for value in values:
															
 
																+                    behavioral_name = value[0]
															
 
																+                    weight = float(value[2])
															
 
																+                    # standard_score = [x[4] for x in scores if x[2] == behavioral_name]
															
 
																+                    standard_score = float(value[1])
															
 
																+                    if standard_score is not None:
															
 
																+                        score += standard_score * weight
															
 
																+                result.append(['上海市', '85后', crowd, module_name, score])
															
 
																+        return {'score': result, 'data': self.module_scores}
															
 
																+
															
 
																+    def tag_module_score_insert(self):
															
 
																+        """
															
 
																+            标签模块分数写入数据库
															
 
																+        :return:
															
 
																+        """
															
 
																+        ids = self.query_data()
															
 
																+        insert_data = []
															
 
																+        insert_data_1 = []
															
 
																+        for tag, module in zip(self.scores_tag, self.score_module):
															
 
																+            city = tag[0]
															
 
																+            age = tag[1]
															
 
																+            crowd = tag[2]
															
 
																+            tag_name = tag[3]
															
 
																+            tag_score = tag[4]
															
 
																+
															
 
																+            city_2 = module[0]
															
 
																+            age_2 = module[1]
															
 
																+            crowd_2 = module[2]
															
 
																+            module_name_2 = module[3]
															
 
																+            module_score_2 = module[4]
															
 
																+
															
 
																+            for id in ids:
															
 
																+                city_1 = id[2]
															
 
																+                age_1 = id[1]
															
 
																+                crowd_1 = id[3]
															
 
																+                id_1 = id[0]
															
 
																+                if city == city_1 and self.age_dict[age] == age_1 and crowd == crowd_1:
															
 
																+                    insert_data.append([id_1, tag_name, tag_score])
															
 
																+                if city_2 == city_1 and self.age_dict[age_2] == age_1 and crowd_2 == crowd_1:
															
 
																+                    insert_data_1.append([id_1, module_name_2, module_score_2])
															
 
																+        self.shangju_db.add_some(self.sql_12, insert_data)
															
 
																+        self.shangju_db.add_some(self.sql_13, insert_data_1)
															
 
																+
															
 
																+    def init_age(self):
															
 
																+        """
															
 
																+           获取答题数据中的年龄
															
 
																+        """
															
 
																+        age_info = self.marketing_db.select(self.sql_4)
															
 
																+        # print([x[0] for x in age_info])
															
 
																+        return [x[0] for x in age_info if x[0] is not None]
															
 
																+
															
 
																+    def city_age_crowd(self, city=None, age=None, crowd=None):
															
 
																+        data_start = []
															
 
																+        result = []
															
 
																+        module_scores = []
															
 
																+        if city is not None and age is not None and crowd is not None:
															
 
																+            print('获取指定城市，年龄段，人群类型的数据...')
															
 
																+            people_uuids = self.get_people_uuid_by_type(crowd)
															
 
																+            if len(people_uuids) > 0:
															
 
																+                print('{}-{}-{}'.format(city, age, crowd))
															
 
																+                datas = self.behavior_tag_init(city, age, people_uuids)
															
 
																+                data_start.append(datas)
															
 
																+                result.extend(self.calculation_standard_score(datas, city, age, crowd))
															
 
																+            module_scores.extend(self.module_score(crowd, city, age, result))
															
 
																+            pass
															
 
																+        else:
															
 
																+            print('获取所有case的数据...')
															
 
																+            # for city in self.citys:
															
 
																+            # for city in [city]:
															
 
																+            for age in self.age:
															
 
																+                for crowd_type in self.crowd:
															
 
																+                    if age == '85-89年生' and city == '上海市':
															
 
																+                        print('上海市85后数据导入人工值，无需计算...')
															
 
																+                        pass
															
 
																+                    else:
															
 
																+                        # print(' {}{}'.format(city, age))
															
 
																+                        people_uuids = self.get_people_uuid_by_type(crowd_type)
															
 
																+                        if len(people_uuids) > 0:
															
 
																+                            print('{}-{}-{}'.format(city, age, crowd_type))
															
 
																+                            datas = self.behavior_tag_init(city, age, people_uuids)
															
 
																+                            data_start.append(datas)
															
 
																+                            result.extend(self.calculation_standard_score(datas, city, age, crowd_type))
															
 
																+                        module_scores.extend(self.module_score(crowd_type, city, age, result))
															
 
																+        # return result
															
 
																+        # data_list = []
															
 
																+        # for e in data_start:
															
 
																+        #     for key in e.keys():
															
 
																+        #         values = e[key]
															
 
																+        #         for sub_e in values:
															
 
																+        #             ele = [key]
															
 
																+        #             ele.extend(sub_e)
															
 
																+        #             data_list.append(ele)
															
 
																+        #     pass
															
 
																+        return {'tag_score': result, 'module_score': module_scores}
															
 
																+        # return {'score': result, 'data': data_list}
															
 
																+
															
 
																+    def behavior_tag_init(self, city, age, people_uuids):
															
 
																+        result = {}
															
 
																+        self.group_type_count = self.marketing_db.select(self.sql_5, [city, city, age, people_uuids])
															
 
																+        # 表名
															
 
																+        for key in self.tag_data:
															
 
																+            values = self.tag_data[key]
															
 
																+            result_sub = {}
															
 
																+            # 标签
															
 
																+            for key_tag_name in values.keys():
															
 
																+                questions = values[key_tag_name]
															
 
																+                elements = []
															
 
																+                for value in questions:
															
 
																+                    question = value[0].split('-')[0]
															
 
																+                    option = value[0].split('-')[1]
															
 
																+                    corr = value[1]
															
 
																+                    fz, fm = self.molecular_value(question, option, city, age, people_uuids)
															
 
																+                    if fm == 0:
															
 
																+                        c = 0
															
 
																+                    else:
															
 
																+                        c = fz / fm
															
 
																+                    elements.append([question, option, corr, fz, fm, c])
															
 
																+                result_sub[key_tag_name] = elements
															
 
																+            result[key] = self.indicator_calculation_d_e(result_sub)
															
 
																+        return result
															
 
																+
															
 
																+    def molecular_value(self, queston, option, city, age, people_uuids):
															
 
																+        # 获取当前父选项包含的子选项id和子题id列表
															
 
																+        result = self.shangju_db.select(self.sql_6, [option, queston])
															
 
																+        sub_option_ids = []
															
 
																+        group_types = []
															
 
																+        for rt in result:
															
 
																+            sub_option_id, sub_question_id, content = rt[0], rt[1], rt[2]
															
 
																+            grouptypes = self.shangju_db.select(self.sql_7, [sub_question_id])
															
 
																+            for g_t in grouptypes:
															
 
																+                if g_t[0] not in group_types:
															
 
																+                    group_types.append(g_t[0])
															
 
																+            sub_option_ids.append(sub_option_id)
															
 
																+        # 计算子选项在答题记录中的点击数
															
 
																+        sub_options_count = 0
															
 
																+        if len(sub_option_ids) > 0:
															
 
																+            result_1 = self.marketing_db.select(self.sql_8, [sub_option_ids, city, city, age, people_uuids])
															
 
																+            sub_options_count = result_1[0][0]
															
 
																+        # 计算父选项包含的子选项对应的子题所在的测试gt包含的点击数。
															
 
																+        denominator_value = 0
															
 
																+        for info in self.group_type_count:
															
 
																+            if info[0] in group_types:
															
 
																+                denominator_value += info[1]
															
 
																+        return sub_options_count, denominator_value
															
 
																+
															
 
																+    def indicator_calculation_d_e(self, data):
															
 
																+        result = {}
															
 
																+        for key in data.keys():
															
 
																+            values = data[key]
															
 
																+            c_list = []
															
 
																+            for x in values:
															
 
																+                _x = x[5]
															
 
																+                if _x is not None and x != 0:
															
 
																+                    c_list.append(_x)
															
 
																+            fm_list = [x[4] for x in values]
															
 
																+            sum_c = sum(fm_list)
															
 
																+            if len(c_list) == 0:
															
 
																+                min_c = 0
															
 
																+            else:
															
 
																+                min_c = min(c_list)
															
 
																+            elements = []
															
 
																+            for value in values:
															
 
																+                _value = []
															
 
																+                c = value[5]
															
 
																+                if sum_c == 0:
															
 
																+                    d = 0
															
 
																+                else:
															
 
																+                    d = c / sum_c
															
 
																+                e = c - min_c
															
 
																+                _value.extend(value)
															
 
																+                _value.append(d)
															
 
																+                _value.append(e)
															
 
																+                elements.append(_value)
															
 
																+            result[key] = elements
															
 
																+        return result
															
 
																+
															
 
																+    def calculation_standard_score(self, datas, city, age, crowd_type):
															
 
																+        scores = {}
															
 
																+        for key_tag_type in datas.keys():
															
 
																+            tag_type_data = datas[key_tag_type]
															
 
																+            scores_sub = []
															
 
																+            for key_tag in tag_type_data.keys():
															
 
																+                key_tag_data = tag_type_data[key_tag]
															
 
																+                print(key_tag)
															
 
																+                print('     父题序号 父选项序号 相关系系数 分子值 分母值 百分比 人数权重 偏离值')
															
 
																+                values = [x[5] for x in key_tag_data]
															
 
																+                min_c = min(values)
															
 
																+                f = min_c
															
 
																+                for value in key_tag_data:
															
 
																+                    print('     {}'.format(value))
															
 
																+                    if value[2] is not None and value[7] is not None:
															
 
																+                        f += float(value[2] * value[7])
															
 
																+                print('     标准分：{}'.format(f))
															
 
																+                scores_sub.append([city, age, key_tag, crowd_type, f])
															
 
																+            scores[key_tag_type] = scores_sub
															
 
																+            # self.shangju_db.add_some(self.sql_9, scores)
															
 
																+        return scores
															
 
																+
															
 
																+    def get_crowd_people(self):
															
 
																+        result = {}
															
 
																+        for type in self.crowd:
															
 
																+            uuids = self.get_people_uuid_by_type(type)
															
 
																+            result[type] = len(uuids)
															
 
																+        return result
															
 
																+
															
 
																+    def get_people_uuid_by_type(self, type):
															
 
																+        uuids = []
															
 
																+        type_sub_option_ids = self.crowd_contain_sub_option_ids[type]
															
 
																+        for people in self.people_sub_option_ids:
															
 
																+            uuid = people[0]
															
 
																+            sub_option_ids = list(map(int, str(people[1]).split(',')))
															
 
																+            # list(set(a).intersection(set(b)))
															
 
																+            if len(list(set(sub_option_ids).intersection(set(type_sub_option_ids)))) > 0 and uuid not in uuids:
															
 
																+                uuids.append(uuid)
															
 
																+        return uuids
															
 
																+
															
 
																+    def get_crowd_contain_sub_option_ids(self):
															
 
																+        """
															
 
																+            获取ABCDEF人群包含的子选项id
															
 
																+        :return:
															
 
																+        """
															
 
																+        infos = {}
															
 
																+        for key in self.crowd_info.keys():
															
 
																+            values = self.crowd_info[key]
															
 
																+            sub_option_ids = []
															
 
																+            for value in values:
															
 
																+                if value is not None:
															
 
																+                    vals = str(value).split('-')
															
 
																+                    option, question = vals[1], vals[0]
															
 
																+                    query_result = self.shangju_db.select(self.sql_6, [option, question])
															
 
																+                    for qr in query_result:
															
 
																+                        sub_option_id, sub_question_id, content = qr[0], qr[1], qr[2]
															
 
																+                        sub_option_ids.append(int(sub_option_id))
															
 
																+            infos[key] = sub_option_ids
															
 
																+        print(infos)
															
 
																+        return infos
															
--- a/mvp/__pycache__/mvp.cpython-36.pyc
+++ b/mvp/__pycache__/mvp.cpython-36.pyc
--- a/mvp/__pycache__/mvp.cpython-37.pyc
+++ b/mvp/__pycache__/mvp.cpython-37.pyc
--- a/mvp/mvp.py
+++ b/mvp/mvp.py
@@ -1,267 +0,0 @@
 
																-from db.mysql_db import MysqlDB
															
 
																-from utils.excel_util import ExcelUtil
															
 
																-
															
 
																-
															
 
																-class Mvp:
															
 
																-    """
															
 
																-     ce mvp 答题数据统计
															
 
																-     城市特例 北京市，上海市， 重庆市，天津市
															
 
																-    """
															
 
																-
															
 
																-    age_dict = {
															
 
																-        '00-04年生': '00后',
															
 
																-        '05-09年生': '05后',
															
 
																-        '50-59年生': '50后',
															
 
																-        '60-69年生': '60后',
															
 
																-        '70-74年生': '70后',
															
 
																-        '75-79年生': '75后',
															
 
																-        '80-84年生': '80后',
															
 
																-        '85-89年生': '85后',
															
 
																-        '90-94年生': '90后',
															
 
																-        '95-99年生': '95后'
															
 
																-    }
															
 
																-
															
 
																-    crowd = ['A', 'B', 'C', 'D', 'E', 'F']
															
 
																-
															
 
																-    # 获取答题记录中城市列表
															
 
																-    sql_1 = 'select city from f_t_daren_score_2 group by city'
															
 
																-
															
 
																-    # 获取父选项和父题id
															
 
																-    sql_2 = 'select a.id, a.content, b.id, b.name from bq_option a left join bq_question b on a.question_id = b.id ' \
															
 
																-            'where a.serial_number = %s and b.serial_number = %s and a.status = b.status = 1 '
															
 
																-    # 数据插入表mvp_question_classification
															
 
																-    sql_3 = 'insert into mvp_question_classification(question_serial_number, question_content, ' \
															
 
																-            'option_serial_number, option_content, tag, corr) values(%s, %s, %s, %s, %s, %s) '
															
 
																-
															
 
																-    # 获取答题人的年龄段集合
															
 
																-    sql_4 = 'select nld from f_t_daren_score_2 group by nld'
															
 
																-
															
 
																-    # 根据城市，年龄段，人群分类统计答题记录数
															
 
																-    sql_5 = 'select group_type, COUNT(uuid) from f_t_daren_score_2 where (city = %s or province = %s) and nld ' \
															
 
																-            '= %s and uuid in %s group by group_type '
															
 
																-
															
 
																-    # 根据父选项获取子选项id列表
															
 
																-    sql_6 = 'SELECT c.id, c.sub_question_id, c.content FROM bq_sub_option c WHERE c.father_id in (SELECT a.id FROM ' \
															
 
																-            'bq_option a ' \
															
 
																-            'LEFT JOIN bq_question b ON a.question_id = b.id WHERE a.serial_number = %s AND b.serial_number = %s ' \
															
 
																-            'and a.status = 1 and b.status = 1) and c.status = 1 '
															
 
																-
															
 
																-    # 根据子题id获取包含子题id的测试
															
 
																-    sql_7 = 'select group_type from bq_testcase where status = 1 and FIND_IN_SET(%s, question_ids)'
															
 
																-
															
 
																-    # 根据子选项id统计答题数
															
 
																-    sql_8 = 'SELECT count(uuid) FROM f_t_daren_score_2 a LEFT JOIN d_shangju_tiku_02 b ON a.sub_question_id = ' \
															
 
																-            'b.sub_question_id AND a.score  = b.score WHERE a.testcase_id = b.testcase_id and b.sub_option_id in %s' \
															
 
																-            'and (a.city = %s or a.province = %s) and a.nld = %s and a.uuid in %s'
															
 
																-
															
 
																-    # 计算值写入表汇总
															
 
																-    sql_9 = 'insert into mvp_standard_score(city, age, tag, crowd_type, score)  VALUES(%s, %s, %s, %s, %s)'
															
 
																-
															
 
																-    # 获取一个uuid下答题的子选项id列表
															
 
																-    sql_10 = 'select  DISTINCT uuid, GROUP_CONCAT(DISTINCT b.sub_option_id)  from f_t_daren_score_2 a left join ' \
															
 
																-             'd_shangju_tiku_02 b on a.sub_question_id = b.sub_question_id and a.score = b.score where a.status = ' \
															
 
																-             'b.status = 1 group by uuid '
															
 
																-
															
 
																-    def __init__(self, path=None):
															
 
																-        self.shangju_db = MysqlDB('shangju')
															
 
																-        self.marketing_db = MysqlDB('marketing_db')
															
 
																-        self.shangju_db.truncate('mvp_standard_score')
															
 
																-        self.tag_data = ExcelUtil(path=path).init_mvp_data()
															
 
																-        self.crowd_info = ExcelUtil(path=path, sheet_name='选项-人群分类对应表').init_crowd_info()
															
 
																-        self.citys = self.init_city()
															
 
																-        self.age = self.init_age()
															
 
																-        self.people_sub_option_ids = self.marketing_db.select(self.sql_10)
															
 
																-        self.crowd_contain_sub_option_ids = self.get_crowd_contain_sub_option_ids()
															
 
																-
															
 
																-    def init_city(self):
															
 
																-        """
															
 
																-            获取答题数据中的城市。
															
 
																-        :return:
															
 
																-        """
															
 
																-        citys = ['北京市', '上海市', '重庆市', '天津市']
															
 
																-        citys_info = self.marketing_db.select(self.sql_1)
															
 
																-        citys.extend([x[0] for x in citys_info if x[0] is not None])
															
 
																-        return citys
															
 
																-
															
 
																-    def write_tag(self, city=None, age=None, crowd=None):
															
 
																-        """
															
 
																-            将excel中的配置信息写入到数据库表中
															
 
																-        :return:
															
 
																-        """
															
 
																-        # datas = []
															
 
																-        # for key in self.tag_data.keys():
															
 
																-        #     values = self.tag_data[key]
															
 
																-        #     for value in values:
															
 
																-        #         question = value[0].split('-')[0]
															
 
																-        #         option = value[0].split('-')[1]
															
 
																-        #         corr = value[1]
															
 
																-        #         data = self.shangju_db.select(self.sql_2, [option, question])
															
 
																-        #         if len(data) > 0:
															
 
																-        #             print([question, option, data[0][3], data[0][1], key, corr])
															
 
																-        #             datas.append([question, option, data[0][3], data[0][1], key, corr])
															
 
																-        # self.shangju_db.truncate('mvp_question_classification')
															
 
																-        # self.shangju_db.add_some(self.sql_3, datas)
															
 
																-        result = self.city_age_crowd(city, age, crowd)
															
 
																-        print('update finished!!!')
															
 
																-        return result
															
 
																-
															
 
																-    def init_age(self):
															
 
																-        """
															
 
																-           获取答题数据中的年龄
															
 
																-        """
															
 
																-        age_info = self.marketing_db.select(self.sql_4)
															
 
																-        # print([x[0] for x in age_info])
															
 
																-        return [x[0] for x in age_info if x[0] is not None]
															
 
																-
															
 
																-    def city_age_crowd(self, city=None, age=None, crowd=None):
															
 
																-        result = []
															
 
																-        if city is not None and age is not None and crowd is not None:
															
 
																-            print('获取指定城市，年龄段，人群类型的数据...')
															
 
																-            people_uuids = self.get_people_uuid_by_type(crowd)
															
 
																-            if len(people_uuids) > 0:
															
 
																-                print('{}-{}-{}'.format(city, age, crowd))
															
 
																-                datas = self.behavior_tag_init(city, age, people_uuids)
															
 
																-                result.extend(self.calculation_standard_score(datas, city, age, crowd))
															
 
																-            pass
															
 
																-        else:
															
 
																-            print('获取所有case的数据...')
															
 
																-            for city in self.citys:
															
 
																-                for age in self.age:
															
 
																-                    if city != '上海市' and age != '85-89年生':
															
 
																-                        for crowd_type in self.crowd:
															
 
																-                            # print(' {}{}'.format(city, age))
															
 
																-                            people_uuids = self.get_people_uuid_by_type(crowd_type)
															
 
																-                            if len(people_uuids) > 0:
															
 
																-                                print('{}-{}-{}'.format(city, age, crowd_type))
															
 
																-                                datas = self.behavior_tag_init(city, age, people_uuids)
															
 
																-                                result.extend(self.calculation_standard_score(datas, city, age, crowd_type))
															
 
																-        return result
															
 
																-
															
 
																-    def behavior_tag_init(self, city, age, people_uuids):
															
 
																-        result = {}
															
 
																-        self.group_type_count = self.marketing_db.select(self.sql_5, [city, city, age, people_uuids])
															
 
																-        for key in self.tag_data:
															
 
																-            values = self.tag_data[key]
															
 
																-            elements = []
															
 
																-            for value in values:
															
 
																-                question = value[0].split('-')[0]
															
 
																-                option = value[0].split('-')[1]
															
 
																-                corr = value[1]
															
 
																-                fz, fm = self.molecular_value(question, option, city, age, people_uuids)
															
 
																-                if fm == 0:
															
 
																-                    c = 0
															
 
																-                else:
															
 
																-                    c = fz / fm
															
 
																-                elements.append([question, option, corr, fz, fm, c])
															
 
																-            result[key] = elements
															
 
																-        return self.indicator_calculation_d_e(result)
															
 
																-
															
 
																-    def molecular_value(self, queston, option, city, age, people_uuids):
															
 
																-        # 获取当前父选项包含的子选项id和子题id列表
															
 
																-        result = self.shangju_db.select(self.sql_6, [option, queston])
															
 
																-        sub_option_ids = []
															
 
																-        group_types = []
															
 
																-        for rt in result:
															
 
																-            sub_option_id, sub_question_id, content = rt[0], rt[1], rt[2]
															
 
																-            grouptypes = self.shangju_db.select(self.sql_7, [sub_question_id])
															
 
																-            for g_t in grouptypes:
															
 
																-                if g_t[0] not in group_types:
															
 
																-                    group_types.append(g_t[0])
															
 
																-            sub_option_ids.append(sub_option_id)
															
 
																-        # 计算子选项在答题记录中的点击数
															
 
																-
															
 
																-        sub_options_count = 0
															
 
																-        if len(sub_option_ids) > 0:
															
 
																-            result_1 = self.marketing_db.select(self.sql_8, [sub_option_ids, city, city, age, people_uuids])
															
 
																-            sub_options_count = result_1[0][0]
															
 
																-        # 计算父选项包含的子选项对应的子题所在的测试gt包含的点击数。
															
 
																-        denominator_value = 0
															
 
																-        for info in self.group_type_count:
															
 
																-            if info[0] in group_types:
															
 
																-                denominator_value += info[1]
															
 
																-        return sub_options_count, denominator_value
															
 
																-
															
 
																-    def indicator_calculation_d_e(self, data):
															
 
																-        result = {}
															
 
																-        for key in data.keys():
															
 
																-            values = data[key]
															
 
																-            c_list = [x[5] for x in values]
															
 
																-            fm_list = [x[4] for x in values]
															
 
																-            sum_c = sum(fm_list)
															
 
																-            min_c = min(c_list)
															
 
																-            elements = []
															
 
																-            for value in values:
															
 
																-                _value = []
															
 
																-                c = value[5]
															
 
																-                if sum_c == 0:
															
 
																-                    d = 0
															
 
																-                else:
															
 
																-                    d = c / sum_c
															
 
																-                e = c - min_c
															
 
																-                _value.extend(value)
															
 
																-                _value.append(d)
															
 
																-                _value.append(e)
															
 
																-                elements.append(_value)
															
 
																-            result[key] = elements
															
 
																-        return result
															
 
																-
															
 
																-    def calculation_standard_score(self, datas, city, age, crowd_type):
															
 
																-        scores = []
															
 
																-        for key in datas.keys():
															
 
																-            print(key)
															
 
																-            print('     父题序号 父选项序号 相关系系数 分子值 分母值 百分比 人数权重 偏离值')
															
 
																-            values = [x[5] for x in datas[key]]
															
 
																-            min_c = min(values)
															
 
																-            f = min_c
															
 
																-            for value in datas[key]:
															
 
																-                print('     {}'.format(value))
															
 
																-                if value[2] is not None and value[7] is not None:
															
 
																-                    f += float(value[2] * value[7])
															
 
																-            print('     标准分：{}'.format(f))
															
 
																-            scores.append([city, age, key, crowd_type, f])
															
 
																-        # self.shangju_db.add_some(self.sql_9, scores)
															
 
																-        return scores
															
 
																-
															
 
																-    def get_crowd_people(self):
															
 
																-        result = {}
															
 
																-        for type in self.crowd:
															
 
																-            uuids = self.get_people_uuid_by_type(type)
															
 
																-            result[type] = len(uuids)
															
 
																-        return result
															
 
																-
															
 
																-    def get_people_uuid_by_type(self, type):
															
 
																-        # 获取每个答题者所答题的子选项id
															
 
																-        uuids = []
															
 
																-        type_sub_option_ids = self.crowd_contain_sub_option_ids[type]
															
 
																-        for people in self.people_sub_option_ids:
															
 
																-            uuid = people[0]
															
 
																-            sub_option_ids = str(people[1]).split(',')
															
 
																-            # list(set(a).intersection(set(b)))
															
 
																-            if len(list(set(sub_option_ids).intersection(set(type_sub_option_ids)))) > 0:
															
 
																-                uuids.append(uuid)
															
 
																-        return uuids
															
 
																-
															
 
																-    def get_crowd_contain_sub_option_ids(self):
															
 
																-        """
															
 
																-            获取ABCDEF人群包含的子选项id
															
 
																-        :return:
															
 
																-        """
															
 
																-        infos = {}
															
 
																-        for key in self.crowd_info.keys():
															
 
																-            values = self.crowd_info[key]
															
 
																-            sub_option_ids = []
															
 
																-            for value in values:
															
 
																-                if value is not None:
															
 
																-                    vals = str(value).split('-')
															
 
																-                    option, question = vals[1], vals[0]
															
 
																-                    query_result = self.shangju_db.select(self.sql_6, [option, question])
															
 
																-                    for qr in query_result:
															
 
																-                        sub_option_id, sub_question_id, content = qr[0], qr[1], qr[2]
															
 
																-                        sub_option_ids.append(sub_option_id)
															
 
																-            infos[key] = sub_option_ids
															
 
																-        return infos
															
 
																-
															
 
																-
															
 
																-if __name__ == '__main__':
															
 
																-    mvp = Mvp()
															
 
																-    mvp.write_tag()
															
--- a/db/mysql_db.py
+++ b/db/mysql_db.py
@@ -10,8 +10,10 @@ class MysqlDB:
 
																     def __init__(self, db_name):
															
 
																         self.db_name = db_name
															
 
																-        self.con = ps.connect(host='192.168.0.13', port=3306, user='root', password='elab@123',
															
 
																-                              db=self.db_name, charset='utf8')
															
 
																+        # self.con = ps.connect(host='172.19.189.136', port=3306, user='bi_etl', password='XPtpswuU5lwGo4kx',
															
 
																+        #                       db=self.db_name, charset='utf8')
															
 
																+        self.con = ps.connect(host='192.168.0.13', port=3306, user='root', password='elab@123'
															
 
																+                              , db=self.db_name, charset='utf8')
															
 
																         self.cursor = self.con.cursor()
															
 
																     def show_tables(self):
															
@@ -48,13 +50,4 @@ class MysqlDB:
 
																     def close(self):
															
 
																         self.cursor.close()
															
 
																-        self.con.close()
															
 
																-
															
 
																-
															
 
																-if __name__ == '__main__':
															
 
																-    mysql_db = MysqlDB('marketing_db')
															
 
																-    # sql = 'select * from bq_question a left join bq_option b on a.id = b.question_id where a.status = 1 and b.status = 1'
															
 
																-    sql = 'select city from f_t_daren_score_2 group by city'
															
 
																-    result = mysql_db.select(sql)
															
 
																-    for rt in result:
															
 
																-        print(rt)
															
 
																+        self.con.close()
															
--- a/resources/mvp.sql
+++ b/resources/mvp.sql
@@ -1,30 +1,16 @@
 
																-create table `mvp_standard_score` (
															
 
																-    `id` int(11) NOT NULL AUTO_INCREMENT COMMENT 'id',
															
 
																-    `score` VARCHAR(10) NOT NULL COMMENT '标准分',
															
 
																-	`city` VARCHAR(10) DEFAULT NULL COMMENT '城市',
															
 
																-	`age` varchar(10) default NULL COMMENT '年龄',
															
 
																-    `tag` VARCHAR(10) DEFAULT NULL COMMENT '标签',
															
 
																-	`status` int(11) DEFAULT '1' COMMENT '1:EFFECTIVE:有效\r\n            -1:INVALID:无效',
															
 
																-    `created` datetime DEFAULT NULL COMMENT '创建时间',
															
 
																-    `creator` varchar(100) DEFAULT NULL COMMENT '创建人',
															
 
																-    `updated` datetime DEFAULT NULL COMMENT '修改时间',
															
 
																-    `updator` varchar(100) DEFAULT NULL COMMENT '修改人',
															
 
																-    PRIMARY KEY (`id`)
															
 
																-)ENGINE=InnoDB AUTO_INCREMENT=1 DEFAULT CHARSET=utf8mb4 COMMENT='mvp标准分'
															
 
																-
															
 
																-
															
 
																-create table `mvp_question_classification` (
															
 
																-    `id` int(11) NOT NULL AUTO_INCREMENT COMMENT 'id',
															
 
																-	`tag` VARCHAR(50) DEFAULT NULL COMMENT '标签名',
															
 
																-	`question_serial_number` varchar(50) DEFAULT NULL COMMENT '父题编号',
															
 
																-	`option_serial_number` varchar(50) DEFAULT NULL COMMENT '父选项编号',
															
 
																-	`question_content` VARCHAR(50) DEFAULT NULL COMMENT '父题内容',
															
 
																-	`option_content` VARCHAR(50) DEFAULT NULL COMMENT '父选项内容',
															
 
																-	`corr` DOUBLE(16,2) DEFAULT NULL COMMENT '关联度系数',
															
 
																-    `status` int(11) DEFAULT '1' COMMENT '1:EFFECTIVE:有效,-1:INVALID:无效',
															
 
																-    `created` datetime DEFAULT NULL COMMENT '创建时间',
															
 
																-    `creator` varchar(100) DEFAULT NULL COMMENT '创建人',
															
 
																-    `updated` datetime DEFAULT NULL COMMENT '修改时间',
															
 
																-    `updator` varchar(100) DEFAULT NULL COMMENT '修改人',
															
 
																-	PRIMARY KEY (`id`)
															
 
																-) ENGINE=InnoDB AUTO_INCREMENT=1 DEFAULT CHARSET=utf8mb4 COMMENT='mvp父题分类'
															
 
																+CREATE TABLE `mvp_crowd_info_module` (
															
 
																+  `id` int(11) NOT NULL AUTO_INCREMENT COMMENT 'id',
															
 
																+  `crowd_info_id` int(11) DEFAULT NULL COMMENT '用户人群信息id',
															
 
																+  `module_name` varchar(50) DEFAULT NULL COMMENT '模块名称',
															
 
																+  `default_value` float(5,2) DEFAULT NULL COMMENT '原始数值',
															
 
																+  `standard_value` float(5,2) DEFAULT NULL COMMENT '标准值',
															
 
																+  `content` varchar(50) DEFAULT NULL COMMENT '内容',
															
 
																+  `url` varchar(300) DEFAULT NULL COMMENT '链接',
															
 
																+  `remarks` varchar(500) DEFAULT NULL COMMENT '备注',
															
 
																+  `status` int(11) DEFAULT '1' COMMENT '1:EFFECTIVE:有效 -1:INVALID:无效',
															
 
																+  `created` datetime DEFAULT NULL COMMENT '创建时间',
															
 
																+  `creator` varchar(100) DEFAULT NULL COMMENT '创建人',
															
 
																+  `updated` datetime DEFAULT NULL COMMENT '修改时间',
															
 
																+  `updator` varchar(100) DEFAULT NULL COMMENT '修改人',
															
 
																+  PRIMARY KEY (`id`)
															
 
																+) ENGINE=InnoDB AUTO_INCREMENT=1 DEFAULT CHARSET=utf8mb4 COMMENT='模块分数'
															
--- a/resources/mvp.xlsx
+++ b/resources/mvp.xlsx
--- a/resources/行为与模块分值汇总.xlsx
+++ b/resources/行为与模块分值汇总.xlsx
--- a/start_shell.sh
+++ b/start_shell.sh
@@ -1,3 +1,5 @@
 
																 #!/bin/bash
															
 
																 # 开发环境部署
															
 
																 python3 flask_app.py >>/tmp/huxingbao.log 2>&1 &
															
 
																+# 生产环境部署方式，使用gunicorn进行部署。
															
 
																+# gunicorn -w 1 -b 0.0.0.0:5001 service:app
															
--- a/utils/__pycache__/excel_util.cpython-37.pyc
+++ b/utils/__pycache__/excel_util.cpython-37.pyc