Apriori算法(C#)

AprioriMethod.cs

using System;

using System.Collections.Generic;

using System.Linq;

using System.Web;

/// <summary>
/// Apriori miner for frequent itemsets and association rules.
/// A transaction is a string of items separated by ';' (a trailing ';' is optional).
/// An itemset is represented by a key string in which every item is followed by ';'
/// and the items appear in ordinal (code-point) order, e.g. "a;b;c;".
/// </summary>
public class AprioriMethod
{
    // Default minimum support, expressed as an absolute number of transactions.
    // NOTE(review): the literal was lost in the published listing; 2 is assumed - confirm.
    private const int DefaultSupport = 2;

    // Default minimum confidence a rule must reach to be reported.
    private const double DefaultConfidence = 0.7;

    // Separator between items, as a char[] for String.Split.
    private static readonly char[] item_Split = { ';' };

    // Separator between items, as a string for building itemset keys.
    private const string itemSplit = ";";

    // Arrow placed between the antecedent and the consequent of a rule.
    private const string CON = "->";

    // Built-in demo transactions used by the parameterless constructor.
    // The first entry intentionally keeps its original form without a trailing ';'.
    private static readonly string[] SampleTransactions =
    {
        "移动硬盘;电脑;手机;优盘",
        "电脑;优盘;",
        "电脑;优盘;",
        "手机;电脑;移动硬盘;",
        "移动硬盘;手机;",
        "电脑;手机;",
        "移动硬盘;手机;",
        "移动硬盘;电脑;手机;优盘;",
        "移动硬盘;电脑;手机;"
    };

    // Minimum number of transactions that must contain an itemset for it to be frequent.
    private readonly int support;

    // Minimum confidence for a rule to be returned by getRelationRules.
    private readonly double confidence;

    // All transactions, each tokenised into a set of items. This is per-instance state:
    // a static list filled from the constructor would grow with every new instance.
    private readonly List<HashSet<String>> transList = new List<HashSet<String>>();

    /// <summary>
    /// Creates a miner over the built-in sample transactions with the default thresholds.
    /// </summary>
    public AprioriMethod()
        : this(SampleTransactions, DefaultSupport, DefaultConfidence)
    {
    }

    /// <summary>
    /// Creates a miner over the given transactions.
    /// </summary>
    /// <param name="transactions">Transactions, each a ';'-separated list of items; empty items are ignored.</param>
    /// <param name="minSupport">Minimum number of transactions that must contain an itemset (at least 1).</param>
    /// <param name="minConfidence">Minimum rule confidence, between 0 and 1 inclusive.</param>
    /// <exception cref="ArgumentNullException"><paramref name="transactions"/> is null.</exception>
    /// <exception cref="ArgumentException"><paramref name="transactions"/> contains a null entry.</exception>
    /// <exception cref="ArgumentOutOfRangeException">A threshold is outside its valid range.</exception>
    public AprioriMethod(IEnumerable<String> transactions, int minSupport, double minConfidence)
    {
        if (transactions == null)
        {
            throw new ArgumentNullException("transactions");
        }
        if (minSupport < 1)
        {
            throw new ArgumentOutOfRangeException("minSupport", "The support threshold must be at least 1.");
        }
        if (double.IsNaN(minConfidence) || minConfidence < 0.0 || minConfidence > 1.0)
        {
            throw new ArgumentOutOfRangeException("minConfidence", "The confidence threshold must be between 0 and 1.");
        }

        support = minSupport;
        confidence = minConfidence;

        foreach (String trans in transactions)
        {
            if (trans == null)
            {
                throw new ArgumentException("Transactions must not contain null entries.", "transactions");
            }

            // Tokenising once makes containment checks exact: no dependence on a trailing
            // separator and no false match when one item name is a suffix of another.
            String[] items = trans.Split(item_Split, StringSplitOptions.RemoveEmptyEntries);
            transList.Add(new HashSet<String>(items, StringComparer.Ordinal));
        }
    }

    /// <summary>
    /// Computes every frequent itemset, level by level (1-itemsets, 2-itemsets, ...).
    /// </summary>
    /// <returns>A map from itemset key (e.g. "a;b;") to the number of transactions containing it.</returns>
    public Dictionary<String, int> getFC()
    {
        Dictionary<String, int> frequentCollections = new Dictionary<String, int>();

        Dictionary<String, int> itemkFcMap = getItem1FC();
        while (itemkFcMap.Count != 0)
        {
            // Merge the current level into the overall result.
            foreach (KeyValuePair<String, int> item in itemkFcMap)
            {
                frequentCollections[item.Key] = item.Value;
            }

            // Derive the next level: generate candidates, count them, keep the frequent ones.
            itemkFcMap = getFrequentCandidates(getCandidateCollection(itemkFcMap));
        }

        return frequentCollections;
    }

    /// <summary>
    /// Counts, for each candidate itemset, the transactions that contain all of its items
    /// and keeps the candidates that reach the support threshold.
    /// </summary>
    private Dictionary<String, int> getFrequentCandidates(Dictionary<String, int> candidateCollection)
    {
        Dictionary<String, int> frequent = new Dictionary<String, int>();

        foreach (String candidate in candidateCollection.Keys)
        {
            String[] candidateItems = candidate.Split(item_Split, StringSplitOptions.RemoveEmptyEntries);

            int count = 0;
            foreach (HashSet<String> trans in transList)
            {
                if (trans.IsSupersetOf(candidateItems))
                {
                    count++;
                }
            }

            if (count >= support)
            {
                frequent.Add(candidate, count);
            }
        }

        return frequent;
    }

    /// <summary>
    /// Computes the frequent 1-itemsets. Each transaction contributes at most once per item.
    /// </summary>
    private Dictionary<String, int> getItem1FC()
    {
        Dictionary<String, int> sItem1Fc = new Dictionary<String, int>();

        foreach (HashSet<String> trans in transList)
        {
            foreach (String item in trans)
            {
                String key = item + itemSplit;
                int count;
                sItem1Fc.TryGetValue(key, out count); // count stays 0 when the key is new
                sItem1Fc[key] = count + 1;
            }
        }

        Dictionary<String, int> rItem1Fc = new Dictionary<String, int>();
        foreach (KeyValuePair<String, int> entry in sItem1Fc)
        {
            if (entry.Value >= support)
            {
                rItem1Fc.Add(entry.Key, entry.Value);
            }
        }

        return rItem1Fc;
    }

    /// <summary>
    /// Generates the candidate (k+1)-itemsets from the frequent k-itemsets (join step) and
    /// discards every candidate that has an infrequent k-subset (prune step).
    /// </summary>
    /// <param name="itemkFcMap">The frequent k-itemsets, keyed by itemset key.</param>
    /// <returns>The surviving candidates, each mapped to an initial count of 0.</returns>
    private Dictionary<String, int> getCandidateCollection(Dictionary<String, int> itemkFcMap)
    {
        Dictionary<String, int> candidateCollection = new Dictionary<String, int>();

        // Split every key once instead of once per pair.
        List<String[]> itemsets = new List<String[]>();
        foreach (String key in itemkFcMap.Keys)
        {
            itemsets.Add(key.Split(item_Split, StringSplitOptions.RemoveEmptyEntries));
        }

        foreach (String[] first in itemsets)
        {
            foreach (String[] second in itemsets)
            {
                if (!canJoin(first, second))
                {
                    continue;
                }

                // Join: the shared prefix, then the two differing last items in order.
                String[] joined = new String[first.Length + 1];
                Array.Copy(first, joined, first.Length);
                joined[first.Length] = second[second.Length - 1];

                if (allSubsetsFrequent(joined, itemkFcMap))
                {
                    candidateCollection[toKey(joined)] = 0;
                }
            }
        }

        return candidateCollection;
    }

    /// <summary>
    /// Two k-itemsets can be joined when they agree on their first k-1 items and the last
    /// item of the first sorts strictly before the last item of the second.
    /// </summary>
    private static bool canJoin(String[] first, String[] second)
    {
        if (first.Length == 0 || first.Length != second.Length)
        {
            return false;
        }

        int last = first.Length - 1;
        for (int i = 0; i < last; i++)
        {
            if (!String.Equals(first[i], second[i], StringComparison.Ordinal))
            {
                return false;
            }
        }

        // Ordinal ordering matches the ordinal equality used by the dictionary keys and
        // does not vary with the culture of the thread running the code.
        return String.CompareOrdinal(first[last], second[last]) < 0;
    }

    /// <summary>
    /// Returns true when every subset obtained by dropping one item from the candidate
    /// is itself a frequent itemset.
    /// </summary>
    private static bool allSubsetsFrequent(String[] candidateItems, Dictionary<String, int> itemkFcMap)
    {
        for (int i = 0; i < candidateItems.Length; i++)
        {
            int omitted = i;
            String subC = toKey(candidateItems.Where((item, index) => index != omitted));
            if (!itemkFcMap.ContainsKey(subC))
            {
                return false;
            }
        }

        return true;
    }

    /// <summary>
    /// Builds an itemset key: every item followed by the item separator.
    /// </summary>
    private static String toKey(IEnumerable<String> items)
    {
        return String.Concat(items.Select(item => item + itemSplit).ToArray());
    }

    /// <summary>
    /// Derives association rules from frequent itemsets. For every itemset with more than
    /// one item and every non-empty proper subset A of it, the rule "A->rest" is reported
    /// when count(itemset) / count(A) reaches the confidence threshold.
    /// </summary>
    /// <param name="frequentCollection">Frequent itemsets with their counts, as returned by getFC.</param>
    /// <returns>A map from rule text (e.g. "a;->b;") to its confidence.</returns>
    /// <exception cref="ArgumentNullException"><paramref name="frequentCollection"/> is null.</exception>
    /// <exception cref="KeyNotFoundException">A subset of some itemset is missing from <paramref name="frequentCollection"/>.</exception>
    public Dictionary<String, Double> getRelationRules(Dictionary<String, int> frequentCollection)
    {
        if (frequentCollection == null)
        {
            throw new ArgumentNullException("frequentCollection");
        }

        Dictionary<String, Double> relationRules = new Dictionary<String, Double>();

        foreach (KeyValuePair<String, int> entry in frequentCollection)
        {
            List<String> source = entry.Key.Split(item_Split, StringSplitOptions.RemoveEmptyEntries).ToList();
            if (source.Count <= 1)
            {
                continue; // a single item cannot be split into antecedent and consequent
            }

            double countAll = entry.Value;

            List<List<String>> result = new List<List<String>>();
            buildSubSet(source, result); // all non-empty subsets of source

            foreach (List<String> itemList in result)
            {
                if (itemList.Count >= source.Count)
                {
                    continue; // only proper subsets can be antecedents
                }

                List<String> otherList = source.Where(sourceItem => !itemList.Contains(sourceItem)).ToList();

                String reasonStr = toKey(itemList);  // antecedent
                String resultStr = toKey(otherList); // consequent

                double countReason = frequentCollection[reasonStr];
                double itemConfidence = countAll / countReason;
                if (itemConfidence >= confidence)
                {
                    relationRules[reasonStr + CON + resultStr] = itemConfidence;
                }
            }
        }

        return relationRules;
    }

    /// <summary>
    /// Appends every non-empty subset of <paramref name="sourceSet"/> to
    /// <paramref name="result"/>, preserving the element order of the source in each subset.
    /// </summary>
    private static void buildSubSet(List<String> sourceSet, List<List<String>> result)
    {
        if (sourceSet.Count == 1)
        {
            // Base case: the only non-empty subset of a single element is itself.
            result.Add(new List<String> { sourceSet[0] });
        }
        else if (sourceSet.Count > 1)
        {
            String lastItem = sourceSet[sourceSet.Count - 1];

            // First collect the subsets of the leading n-1 elements.
            buildSubSet(sourceSet.GetRange(0, sourceSet.Count - 1), result);
            int size = result.Count; // number of subsets that do not contain the last element

            // Then add the last element alone ...
            result.Add(new List<String> { lastItem });

            // ... and a copy of each earlier subset extended with the last element.
            for (int i = 0; i < size; i++)
            {
                List<String> clone = new List<String>(result[i]);
                clone.Add(lastItem);
                result.Add(clone);
            }
        }
    }
}

Default.aspx.cs

            // Mine the frequent itemsets from the transactions built into AprioriMethod.
            AprioriMethod apriori = new AprioriMethod();
            Dictionary<String, int> frequentCollection = apriori.getFC();

            // Section header, then one "<itemset>-----<count>" line per frequent itemset.
            Response.Write("----------------频繁集" + "----------------");
            Response.Write("<br/>");
            foreach (KeyValuePair<String, int> itemset in frequentCollection)
            {
                Response.Write(itemset.Key + "-----" + itemset.Value);
                Response.Write("<br/>");
            }

            // Derive the association rules from the frequent itemsets just computed.
            Dictionary<String, Double> relationRules = apriori.getRelationRules(frequentCollection);

            // Section header, then one "<rule>-----<confidence>" line per rule.
            Response.Write("----------------关联规则" + "----------------");
            Response.Write("<br/>");
            foreach (KeyValuePair<String, Double> rule in relationRules)
            {
                Response.Write(rule.Key + "-----" + rule.Value);
                Response.Write("<br/>");
            }

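结果（以下为原文代码的运行输出。注意：第一条交易记录 "移动硬盘;电脑;手机;优盘" 末尾缺少分号，而原文代码按 "项;" 子串匹配来统计多项集，因此该交易中的"优盘"未被计入，例如 电脑;优盘; 的计数为 3 而非 4）：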

----------------频繁集----------------

移动硬盘;-----6

电脑;-----7

手机;-----7

优盘;-----4

电脑;移动硬盘;-----4

电脑;手机;-----5

电脑;优盘;-----3

手机;移动硬盘;-----6

电脑;手机;移动硬盘;-----4

----------------关联规则----------------

电脑;->手机;-----0.714285714285714

手机;->电脑;-----0.714285714285714

优盘;->电脑;-----0.75

手机;->移动硬盘;-----0.857142857142857

移动硬盘;->手机;-----1

电脑;手机;->移动硬盘;-----0.8

电脑;移动硬盘;->手机;-----1

Apriori算法(C#)的更多相关文章

Apriori算法的原理与python 实现。
前言:这是一个老故事, 但每次看总是能从中想到点什么.在一家超市里,有一个有趣的现象:尿布和啤酒赫然摆在一起出售.但是这个奇怪的举措却使尿布和啤酒的销量双双增加了.这不是一个笑话,而是发生在美国沃尔玛 ...
#研发解决方案#基于Apriori算法的Nginx+Lua+ELK异常流量拦截方案
郑昀基于杨海波的设计文档创建于2015/8/13 最后更新于2015/8/25 关键词:异常流量.rate limiting.Nginx.Apriori.频繁项集.先验算法.Lua.ELK 本文档 ...
数据挖掘算法（四）Apriori算法
参考文献: 关联分析之Apriori算法
机器学习实战 - 读书笔记(11) - 使用Apriori算法进行关联分析
前言最近在看Peter Harrington写的"机器学习实战",这是我的学习心得,这次是第11章 - 使用Apriori算法进行关联分析. 基本概念关联分析(associat ...
关联规则挖掘之apriori算法
前言: 众所周知,关联规则挖掘是数据挖掘中重要的一部分,如著名的啤酒和尿布的问题.今天要学习的是经典的关联规则挖掘算法--Apriori算法一.算法的基本原理由k项频繁集去导出k+1项频繁集. 二 ...
利用Apriori算法对交通路况的研究
首先简单描述一下Apriori算法:Apriori算法分为频繁项集的产生和规则的产生. Apriori算法频繁项集的产生: 令ck为候选k-项集的集合,而Fk为频繁k-项集的集合. 1.首先通过单遍扫 ...
Apriori算法例子
1 Apriori介绍 Apriori算法使用频繁项集的先验知识,使用一种称作逐层搜索的迭代方法,k项集用于探索(k+1)项集.首先,通过扫描事务(交易)记录,找出所有的频繁1项集,该集合记做L1,然 ...
Apriori算法实例----Weka，R, Using Weka in my javacode
学习数据挖掘工具中,下面使用4种工具来对同一个数据集进行研究. 数据描述:下面这些数据是15个同学选修课程情况,在课程大纲中共有10门课程供学生选择,下面给出具体的选课情况,以ARFF数据文件保存,名 ...
Apriori算法在购物篮分析中的运用
购物篮分析是一个很经典的数据挖掘案例,运用到了Apriori算法.下面从网上下载的一超市某月份的数据库,利用Apriori算法进行管理分析.例子使用Python+MongoDB 处理过程1 数据建模( ...
关于apriori算法的一个简单的例子
apriori算法是关联规则挖掘中很基础也很经典的一个算法,我认为很多教程出现大堆的公式不是很适合一个初学者理解.因此,本文列举一个简单的例子来演示下apriori算法的整个步骤. 下面这个表格是代表 ...

随机推荐

appium初学者，使用之检查appium环境报错Could not detect Mac OS X Version from sw_vers output: '10.12.1’，
这个问题存在的原因就是appium不兼容最新的mac10.12版本. 由于10.12是最新mac版本,appium1.5.3并未提供支持,所以: 在终端输入grep -rl "Could n ...
用 node.js 创建第一个Hello World
如果我们使用PHP来编写后端的代码时,需要Apache(xampp) 或者 Nginx 的HTTP 服务器,并配上 mod_php5 模块和php-cgi.从这个角度看,整个"接收 HTTP ...
每天一个Linux命令 7
常用yum命令1)查询 yum list #查询所有可用软件包列表yum search 关键字 #搜索服务器上所有和关键字相关的包2)安装 yum -y install 包名选项: install 安 ...
Oracle-函数大全
ORACLE函数大全 1．第一讲单行函数和组函数详解 PL/SQL单行函数和组函数详解函数是一种有零个或多个参数并且有一个返回值的程序.在SQL中Oracle内建了一系列函数,这些函数都可被称为 ...
android学习——环境的搭建
1.安装JDK(java开发工具箱) 下载地址:http://www.oracle.com/technetwork/java/javase/downloads/index.html(根据自己需要下载) ...
那些"不务正业"的IT培训公司
前言大四下期了,现在准备找一份Java开发的实习工作,于是在各大网站上投递简历-智联招聘.51job.拉勾网,慧眼识真金的我必然会把培训机构给过滤掉,对于重庆来说招聘实习的公司少之又少,然而是智联招 ...
Beautils工具类实现的原理
关于内省机制和反射机制请看这一篇博客[还没写完,在草稿中]. 先说一下什么叫做 bean 属性,bean 属性指的是 get / set 方法后的名称,而不是类的属性: 比如: private Str ...
KMP算法C语言实现。弄了好久才搞好。。。
我的这个算法中数组的第一位没有像教材中那样用来存数组的大小,所以会有些许的不同. ...
Angular2开发拙见——组件规划篇
本文集中讲讲笔者目前使用ng2来开发项目时对其组件的使用的个人的一些拙劣的经验. 先简单讲讲从ng1到ng2框架下组件的职责与地位: ng1中的一大特色--指令,分为属性型.标签型.css类型和注释型 ...
CF766 E. Mahmoud and a xor trip [预处理][树形dp]
题解: 二营长!你他娘的意大利炮呢? dp[i][j][0]: 从i,跋涉到以i为根的子树的每一个节点,在第j个数位上一共产生了多少个0. dp[i][j][1]: 从i,跋涉到以i为根的子树的每一个 ...

Apriori算法(C#)

Apriori算法(C#)的更多相关文章

随机推荐

热门专题