Module conversationkg.sample_data.load

Expand source code
from pkg_resources import resource_string, resource_listdir
import json
import os

from ..conversations import EmailCorpus

from ..kgs import EmailKG, TextKG


def get_mailinglist_list():
    """Return the names of the resources stored alongside this module.

    The resource directory of this module is listed via ``pkg_resources``
    and the entries ``__pycache__`` and ``load.py`` are left out. Every
    other entry is returned in the order ``resource_listdir`` yields it
    (presumably one entry per bundled mailing list -- confirm against the
    package layout).
    """
    skipped = {"__pycache__", "load.py"}
    names = []
    for entry in resource_listdir(__name__, "."):
        if entry in skipped:
            continue
        names.append(entry)
    return names


def load_data_raw(mailinglist_name):
    """Read and parse the ``all.json`` resource of one mailing list.

    Args:
        mailinglist_name: Name of the resource subdirectory (relative to
            this module) that contains ``all.json``.

    Returns:
        The object produced by ``json.loads`` on the resource contents
        (callers in this module slice it, so presumably a list).
    """
    resource_path = mailinglist_name + '/all.json'
    raw_bytes = resource_string(__name__, resource_path)
    return json.loads(raw_bytes)

    
def load_data_as_EmailCorpus(mailinglist_name, n_conversations=-1, **email_corpus_args):
    """Load a mailing list's raw data and build an ``EmailCorpus`` from it.

    Args:
        mailinglist_name: Name of the mailing list, passed to
            ``load_data_raw``.
        n_conversations: Maximum number of leading entries of the raw data
            to use. A negative value (the default ``-1``) or ``None`` means
            "no limit": all entries are used.
        **email_corpus_args: Forwarded unchanged to
            ``EmailCorpus.from_email_dicts``.

    Returns:
        The result of ``EmailCorpus.from_email_dicts`` for the selected
        entries.
    """
    json_data = load_data_raw(mailinglist_name)
    # A plain ``[:n_conversations]`` slice with the default of -1 would
    # silently drop the last entry, so only truncate for a real limit.
    if n_conversations is not None and n_conversations >= 0:
        json_data = json_data[:n_conversations]
    return EmailCorpus.from_email_dicts(json_data, **email_corpus_args)



def load_data_as_EmailKG(mailinglist_name, n_conversations=-1, **kwargs):
    """Load a mailing list and wrap the resulting corpus in an ``EmailKG``.

    All arguments are handed on to ``load_data_as_EmailCorpus``; the corpus
    it returns is passed to the ``EmailKG`` constructor.
    """
    return EmailKG(
        load_data_as_EmailCorpus(mailinglist_name, n_conversations, **kwargs)
    )


def load_data_as_TextKG(mailinglist_name, n_conversations=-1, **kwargs):
    """Load a mailing list and wrap the resulting corpus in a ``TextKG``.

    All arguments are handed on to ``load_data_as_EmailCorpus``; the corpus
    it returns is passed to the ``TextKG`` constructor.
    """
    return TextKG(
        load_data_as_EmailCorpus(mailinglist_name, n_conversations, **kwargs)
    )

Functions

def get_mailinglist_list()
Expand source code
def get_mailinglist_list():
    """Return the names of the resources stored alongside this module.

    The resource directory of this module is listed via ``pkg_resources``
    and the entries ``__pycache__`` and ``load.py`` are left out. Every
    other entry is returned in the order ``resource_listdir`` yields it
    (presumably one entry per bundled mailing list -- confirm against the
    package layout).
    """
    skipped = {"__pycache__", "load.py"}
    names = []
    for entry in resource_listdir(__name__, "."):
        if entry in skipped:
            continue
        names.append(entry)
    return names
def load_data_as_EmailCorpus(mailinglist_name, n_conversations=-1, **email_corpus_args)
Expand source code
def load_data_as_EmailCorpus(mailinglist_name, n_conversations=-1, **email_corpus_args):
    """Load a mailing list's raw data and build an ``EmailCorpus`` from it.

    Args:
        mailinglist_name: Name of the mailing list, passed to
            ``load_data_raw``.
        n_conversations: Maximum number of leading entries of the raw data
            to use. A negative value (the default ``-1``) or ``None`` means
            "no limit": all entries are used.
        **email_corpus_args: Forwarded unchanged to
            ``EmailCorpus.from_email_dicts``.

    Returns:
        The result of ``EmailCorpus.from_email_dicts`` for the selected
        entries.
    """
    json_data = load_data_raw(mailinglist_name)
    # A plain ``[:n_conversations]`` slice with the default of -1 would
    # silently drop the last entry, so only truncate for a real limit.
    if n_conversations is not None and n_conversations >= 0:
        json_data = json_data[:n_conversations]
    return EmailCorpus.from_email_dicts(json_data, **email_corpus_args)
def load_data_as_EmailKG(mailinglist_name, n_conversations=-1, **kwargs)
Expand source code
def load_data_as_EmailKG(mailinglist_name, n_conversations=-1, **kwargs):
    """Load a mailing list and wrap the resulting corpus in an ``EmailKG``.

    All arguments are handed on to ``load_data_as_EmailCorpus``; the corpus
    it returns is passed to the ``EmailKG`` constructor.
    """
    return EmailKG(
        load_data_as_EmailCorpus(mailinglist_name, n_conversations, **kwargs)
    )
def load_data_as_TextKG(mailinglist_name, n_conversations=-1, **kwargs)
Expand source code
def load_data_as_TextKG(mailinglist_name, n_conversations=-1, **kwargs):
    """Load a mailing list and wrap the resulting corpus in a ``TextKG``.

    All arguments are handed on to ``load_data_as_EmailCorpus``; the corpus
    it returns is passed to the ``TextKG`` constructor.
    """
    return TextKG(
        load_data_as_EmailCorpus(mailinglist_name, n_conversations, **kwargs)
    )
def load_data_raw(mailinglist_name)
Expand source code
def load_data_raw(mailinglist_name):
    """Read and parse the ``all.json`` resource of one mailing list.

    Args:
        mailinglist_name: Name of the resource subdirectory (relative to
            this module) that contains ``all.json``.

    Returns:
        The object produced by ``json.loads`` on the resource contents
        (callers in this module slice it, so presumably a list).
    """
    resource_path = mailinglist_name + '/all.json'
    raw_bytes = resource_string(__name__, resource_path)
    return json.loads(raw_bytes)