mongodb.py

from chatterbot.storage import StorageAdapter

class Query(object):
    """
    Builder for MongoDB filter documents.

    Each builder method returns a new ``Query`` and leaves the
    instance it was called on unchanged, so a base query can be
    shared and extended safely.
    """

    def __init__(self, query=None):
        """
        :param query: Initial filter document. An empty filter is used
            when omitted. The dictionary is stored as given (not copied).
        """
        # A None sentinel avoids sharing a single mutable default
        # dictionary between every Query created without arguments.
        self.query = {} if query is None else query

    @staticmethod
    def _copy_operators(query, field):
        """
        Return a copy of the operator dictionary stored under ``field``.

        An empty dictionary is returned when the field is not present.

        :raises TypeError: If the field already holds something other
            than a dictionary, since operators cannot be attached to it.
        """
        operators = query.get(field, {})

        if not isinstance(operators, dict):
            raise TypeError(
                'Cannot add query operators to the field "{}" because it '
                'already holds a plain value.'.format(field)
            )

        # Copy so that the nested dictionary of the source query is
        # never modified through the derived query.
        return dict(operators)

    def value(self):
        """
        Return a shallow copy of the filter document.
        """
        return self.query.copy()

    def raw(self, data):
        """
        Return a new query with the key/value pairs of ``data`` merged in.

        Keys in ``data`` replace keys that already exist in the filter.
        """
        query = self.query.copy()
        query.update(data)

        return Query(query)

    def statement_text_equals(self, statement_text):
        """
        Return a new query whose ``text`` field is set to ``statement_text``.
        """
        query = self.query.copy()
        query['text'] = statement_text

        return Query(query)

    def statement_text_not_in(self, statements):
        """
        Return a new query that appends ``statements`` to the ``$nin``
        list of the ``text`` field.

        :raises TypeError: If ``text`` already holds a plain value.
        """
        query = self.query.copy()

        text_filter = self._copy_operators(query, 'text')

        # Build a fresh list instead of extending the existing one so the
        # query this one was derived from keeps its own exclusion list.
        excluded = list(text_filter.get('$nin', []))
        excluded.extend(statements)

        text_filter['$nin'] = excluded
        query['text'] = text_filter

        return Query(query)

    def statement_response_list_contains(self, statement_text):
        """
        Return a new query whose ``in_response_to`` field has an
        ``$elemMatch`` condition with ``text`` set to ``statement_text``.

        :raises TypeError: If ``in_response_to`` already holds a plain value.
        """
        query = self.query.copy()

        response_filter = self._copy_operators(query, 'in_response_to')

        # Copy the nested $elemMatch document as well; the shallow copy
        # above only protects the first level.
        element_match = dict(response_filter.get('$elemMatch', {}))
        element_match['text'] = statement_text

        response_filter['$elemMatch'] = element_match
        query['in_response_to'] = response_filter

        return Query(query)

    def statement_response_list_equals(self, response_list):
        """
        Return a new query whose ``in_response_to`` field is set to
        ``response_list``.
        """
        query = self.query.copy()
        query['in_response_to'] = response_list

        return Query(query)

class MongoDatabaseAdapter(StorageAdapter):
    """
    The MongoDatabaseAdapter is an interface that allows
    ChatterBot to store statements in a MongoDB database.

    :keyword database: The name of the database you wish to connect to.
    :type database: str

    .. code-block:: python

       database='chatterbot-database'

    :keyword database_uri: The URI of a remote instance of MongoDB.
    :type database_uri: str

    .. code-block:: python

       database_uri='mongodb://example.com:8100/'
    """

    def __init__(self, **kwargs):
        """
        Connect to MongoDB and prepare the collections used by the adapter.

        Reads the ``database`` and ``database_uri`` options from
        ``self.kwargs`` (presumably populated by the parent initializer;
        verify against ``StorageAdapter``).
        """
        super(MongoDatabaseAdapter, self).__init__(**kwargs)
        from pymongo import MongoClient
        from pymongo.errors import OperationFailure

        self.database_name = self.kwargs.get(
            'database', 'chatterbot-database'
        )
        self.database_uri = self.kwargs.get(
            'database_uri', 'mongodb://localhost:27017/'
        )

        # Connect using the configured URI (a local instance by default)
        self.client = MongoClient(self.database_uri)

        # Increase the sort buffer to 42M if possible
        try:
            self.client.admin.command({'setParameter': 1, 'internalQueryExecMaxBlockingSortBytes': 44040192})
        except OperationFailure:
            # Best effort only: the adapter keeps working with the
            # server's current setting if the command is rejected.
            pass

        # Specify the name of the database
        self.database = self.client[self.database_name]

        # The mongo collection of statement documents
        self.statements = self.database['statements']

        # The mongo collection of conversation documents
        self.conversations = self.database['conversations']

        # Set a requirement for the text attribute to be unique
        self.statements.create_index('text', unique=True)

        self.base_query = Query()

    def get_statement_model(self):
        """
        Return the class for the statement model.

        The ``storage`` attribute is assigned on the imported
        ``Statement`` class itself, not on a copy of it.
        """
        from chatterbot.conversation import Statement

        # Make the statement class storage-aware
        statement = Statement
        statement.storage = self

        return statement

    def get_response_model(self):
        """
        Return the class for the response model.

        The ``storage`` attribute is assigned on the imported
        ``Response`` class itself, not on a copy of it.
        """
        from chatterbot.conversation import Response

        # Make the response class storage-aware
        response = Response
        response.storage = self

        return response

    def count(self):
        """
        Return the number of documents in the statements collection.
        """
        return self.statements.count()

    def find(self, statement_text):
        """
        Return the statement whose text equals ``statement_text``,
        or None if no such document exists.
        """
        query = self.base_query.statement_text_equals(statement_text)

        values = self.statements.find_one(query.value())

        if not values:
            return None

        # Share the document-to-object conversion with the other lookups
        return self.mongo_to_object(values)

    def deserialize_responses(self, response_list):
        """
        Takes the list of response items and returns
        the list converted to Response objects.

        The dictionaries in ``response_list`` are not modified.

        :raises KeyError: If a response item has no ``text`` key.
        """
        Statement = self.get_model('statement')
        Response = self.get_model('response')

        # A throwaway statement is used only to collect the responses
        proxy_statement = Statement('')

        for response in response_list:
            # Work on a copy so the caller's data keeps its text key
            response_data = dict(response)
            text = response_data.pop('text')

            proxy_statement.add_response(
                Response(text, **response_data)
            )

        return proxy_statement.in_response_to

    def mongo_to_object(self, statement_data):
        """
        Return Statement object when given data
        returned from Mongo DB.

        ``statement_data`` itself is left unmodified. Every key other
        than ``text`` is passed to the Statement as a keyword argument.

        :raises KeyError: If ``statement_data`` has no ``text`` key.
        """
        Statement = self.get_model('statement')

        data = dict(statement_data)
        statement_text = data.pop('text')

        data['in_response_to'] = self.deserialize_responses(
            data.get('in_response_to', [])
        )

        return Statement(statement_text, **data)

    def filter(self, **kwargs):
        """
        Returns a list of statements in the database
        that match the parameters specified.

        Keyword arguments with special handling:

        * ``order_by``: field name to sort by. ``created_at`` is sorted
          in descending order, any other field in ascending order.
        * ``in_response_to``: iterable of response texts that the
          ``in_response_to`` list of a statement must equal.
        * ``in_response_to__contains``: a response text that must occur
          in the ``in_response_to`` list of a statement.

        All remaining keyword arguments are added to the query as-is.
        """
        import pymongo

        query = self.base_query

        order_by = kwargs.pop('order_by', None)

        # Convert the response texts to the stored document form
        if 'in_response_to' in kwargs:
            serialized_responses = [
                {'text': response}
                for response in kwargs.pop('in_response_to')
            ]
            query = query.statement_response_list_equals(serialized_responses)

        if 'in_response_to__contains' in kwargs:
            query = query.statement_response_list_contains(
                kwargs.pop('in_response_to__contains')
            )

        query = query.raw(kwargs)

        matches = self.statements.find(query.value())

        if order_by:
            direction = pymongo.ASCENDING

            # Sort so that newer datetimes appear first
            if order_by == 'created_at':
                direction = pymongo.DESCENDING

            matches = matches.sort(order_by, direction)

        return [self.mongo_to_object(match) for match in matches]

    def update(self, statement):
        """
        Save ``statement`` and upsert one document for each of its
        responses, using a single unordered bulk write.

        Bulk write errors are logged rather than raised.

        :returns: The statement that was passed in.
        """
        from pymongo import UpdateOne
        from pymongo.errors import BulkWriteError

        data = statement.serialize()

        operations = [
            UpdateOne(
                {'text': statement.text},
                {'$set': data},
                upsert=True
            )
        ]

        # Make sure that an entry for each response is saved
        for response_dict in data.get('in_response_to', []):
            response_text = response_dict.get('text')

            # NOTE(review): the original comment here described
            # $setOnInsert, but the operation uses $set, so the fields of
            # response_dict are also written to documents that already
            # exist. Confirm which behavior is intended.
            operations.append(
                UpdateOne(
                    {'text': response_text},
                    {'$set': response_dict},
                    upsert=True
                )
            )

        try:
            self.statements.bulk_write(operations, ordered=False)
        except BulkWriteError as bwe:
            # Log the details of a bulk write error
            self.logger.error(str(bwe.details))

        return statement

    def create_conversation(self):
        """
        Create a new conversation.

        :returns: The id of the inserted conversation document.
        """
        conversation_id = self.conversations.insert_one({}).inserted_id
        return conversation_id

    def get_latest_response(self, conversation_id):
        """
        Returns the latest response in a conversation if it exists.
        Returns None if a matching conversation cannot be found or if
        the conversation holds fewer than two statements.
        """
        from pymongo import DESCENDING

        statements = list(self.statements.find({
            'conversations.id': conversation_id
        }).sort('conversations.created_at', DESCENDING))

        # The lookup below needs at least two statements; a conversation
        # with a single statement used to raise an IndexError here.
        if len(statements) < 2:
            return None

        # NOTE(review): with a descending sort, index -2 is the second
        # oldest entry rather than the newest; confirm this is intended.
        return self.mongo_to_object(statements[-2])

    def _push_conversation(self, statement_text, conversation_id, created_at):
        """
        Append a conversation entry to the statement with the given text.
        """
        self.statements.update_one(
            {
                'text': statement_text
            },
            {
                '$push': {
                    'conversations': {
                        'id': conversation_id,
                        'created_at': created_at
                    }
                }
            }
        )

    def add_to_conversation(self, conversation_id, statement, response):
        """
        Add the statement and response to the conversation.
        """
        from datetime import datetime, timedelta

        self._push_conversation(
            statement.text, conversation_id, datetime.utcnow()
        )

        # Force the response to be at least one millisecond after the input statement
        self._push_conversation(
            response.text,
            conversation_id,
            datetime.utcnow() + timedelta(milliseconds=1)
        )

    def get_random(self):
        """
        Returns a random statement from the database

        :raises EmptyDatabaseException: If there are no statements.
        """
        from random import randint

        count = self.count()

        if count < 1:
            raise self.EmptyDatabaseException()

        # Skip a random number of documents and read the next one
        random_integer = randint(0, count - 1)

        statements = self.statements.find().limit(1).skip(random_integer)

        return self.mongo_to_object(list(statements)[0])

    def remove(self, statement_text):
        """
        Removes the statement that matches the input text.
        Removes any responses from statements if the response text matches the
        input text.
        """
        for statement in self.filter(in_response_to__contains=statement_text):
            statement.remove_response(statement_text)
            self.update(statement)

        self.statements.delete_one({'text': statement_text})

    def get_response_statements(self):
        """
        Return only statements that are in response to another statement.
        A statement must exist which lists the closest matching statement in the
        in_response_to field. Otherwise, the logic adapter may find a closest
        matching statement that does not have a known response.
        """
        response_query = self.statements.aggregate([{'$group': {'_id': '$in_response_to.text'}}])

        responses = []
        for group in response_query:
            try:
                responses.extend(group['_id'])
            except TypeError:
                # Skip group ids that are not iterable
                pass

        _statement_query = {
            'text': {
                '$in': responses
            }
        }

        _statement_query.update(self.base_query.value())

        statement_query = self.statements.find(_statement_query)

        return [
            self.mongo_to_object(statement) for statement in statement_query
        ]

    def drop(self):
        """
        Remove the database.
        """
        self.client.drop_database(self.database_name)

mongodb.py的更多相关文章

Python mongoDB 的简单操作
#!/usr/bin/env python # coding:utf-8 # Filename:mongodb.py from pymongo import MongoClient,ASCENDING ...
Python连接MongoDB数据库并执行操作
原文:https://blog.51cto.com/1767340368/2092813 环境设置: [root@mongodb ~]# cat /etc/redhat-release CentOS ...
MongoDB与python 交互
一.安装pymongo 注意 :当同时安装了python2和python3,为区分两者的pip,分别取名为pip2和pip3. 推荐:https://www.cnblogs.com/thunderLL ...
2019-05-25 Python之Mongodb的使用
Mongodb学习总结: one.插入数据pass two.查看数据pass three.修改数据pass four.数据排序pass five.删除数据pass 一.安装Mongodb https: ...
ansible的lookup
lookup路径: /usr/lib/python2.7/site-packages/ansible/plugins/lookup 所有的lookup插件列表cartesian.py dnstxt.p ...
SaltStack介绍及简单配置-第一篇
SaltStack介绍一种全新的基础设施管理方式,部署轻松,在几分钟内可运行起来,扩展性好,很容易管理上万台服务器,速度够快,服务器之间秒级通讯. salt底层采用动态的连接总线, 使其可以用于编配 ...
appium 爬取抖音
1.MongoDB.py import pymongo from pymongo.collection import Collection client = pymongo.MongoClient(h ...
Scrapy的piplines.py存储文件和存储mongodb
一.将数据保存到文件 1.piplines.py文件 import json class TencentPipeline(object): def open_spider(self,spider): ...
py操作mongodb总结
python使用的版本 python3. python操作mongodb使用的是pymongo,安装方法: pip install pymongo 测试 PyMongo 接下来我们可以创建一个测试文件 ...

随机推荐

SpringMVC_01:创建运行环境(Maven)
Maven 环境下配置: 1.新建MavenProject,打包选线根据情况选择jar war和pom jar:打包为jar包,主要用于被其他项目引用 war:打包为war包,可直接运行于服务器 po ...
iOS 5 does not allow to store downloaded data in Documents directory? ios5.0及以后的版本对于下载的文件存储路径有了改变
I have made an application for my client by keeping target iOS as 4. But since the application still ...
泽熙学到的 z
叶展,原泽熙投资总经理助理,现任齐鲁证券资产管理公司总裁助理,齐鲁星空.星汉等集合理财投资经理. 导读:三年前,我加入了泽熙投资,正式成为一名职业投资者.做职业投资者一直是我的理想.在股市中用眼光和头 ...
[置顶] 一个简单好用的zabbix告警信息发送工具
之前使用邮件和短信发送zabbix告警信息,但告警信息无法实时查看或者无法发送,故障无法及时通知运维人员. 后来使用第三方微信接口发送信息,愉快地用了一年多,突然收费了. zabbix告警一直是我的痛 ...
ubuntu下C/C++编程起步
1. 安装VMware虚拟机软件 2. 在VMware中安装linux系统,这里安装的是Ubuntu.(用 VMware 安装 Ubuntu 12.04详细过程图解) 3. ubuntu有自带文本编辑 ...
Drools学习笔记
Drools是一款基于Java的开源规则引擎实现了将业务决策从应用程序中分离出来. 优点: 1.简化系统架构,优化应用 2.提高系统的可维护性和维护成本 3.方便系统的整合 4.减少编写“硬代码”业 ...
AngularJS中选择样式
代码下载:https://files.cnblogs.com/files/xiandedanteng/angularJSSelectClass.rar 要点,{{ctrl.name}}比<spa ...
AngularJS的过滤器示例
代码下载:https://files.cnblogs.com/files/xiandedanteng/angularJSFilter.rar 显示效果: 页面代码: <!DOCTYPE HTML ...
js 输入框增加删除操作
<!DOCTYPE html> <html lang="en"> <head> <meta charset="UTF-8&quo ...
C++必知必会(1)
条款1数据抽象抽象数据类型的用途在于将变成语言扩展到一个特定的问题领域.一般对抽象数据类型的定义须要准训下面步骤: 1. 为类型取一个描写叙述性的名字 2. 列出类型所能运行的操作 ...

mongodb.py

mongodb.py的更多相关文章

随机推荐

热门专题