Source code for nlpir.native.summary

# coding=utf-8
from nlpir.native.nlpir_base import NLPIRBase
from ctypes import c_char_p, c_int, c_float, create_string_buffer


[docs]class Summary(NLPIRBase): load_mode = NLPIRBase.RTLD_LAZY @property def dll_name(self): return "LJSummary"
[docs] @NLPIRBase.byte_str_transform def init_lib(self, data_path: str, encode: int, license_code: str) -> int: """ Call **DS_Init** :param data_path: :param encode: :param license_code: :return: """ return self.get_func("DS_Init", [c_char_p, c_int, c_char_p], c_int)(data_path, encode, license_code)
[docs] @NLPIRBase.byte_str_transform def exit_lib(self) -> bool: """ Call **DS_Exit** :return: """ self.get_func("DS_Exit", None, None)() return True
[docs] @NLPIRBase.byte_str_transform def get_last_error_msg(self) -> str: """ Call **DS_GetLastErrMsg** :return: """ return self.get_func("DS_GetLastErrorMsg", None, c_char_p)()
[docs] @NLPIRBase.byte_str_transform def single_doc( self, text: str, sum_rate: float = 0.0, sum_len: int = 500, html_tag_remove: int = 0, sentence_count: int = 0 ): """ Call **DS_SingleDoc** 生成单文档摘要, make summarization :param str text: 文档内容 text content :param float sum_rate: 文档摘要占原文百分比(为0.00则不限制) the percentage of summarization length comparing to original text (0.00 represent no limit) :param int sum_len: 用户限定的摘要长度(为0则不限制)The max len of summarization(0 will no limit) :param bool html_tag_remove: 是否需要对原文进行Html标签的去除 remove the html tag or not :param int sentence_count: 用户限定的句子数量 (为0则不限制) :return: 摘要字符串;出错返回空串 the summarization content, get null string if occurs error. """ return self.get_func("DS_SingleDoc", [c_char_p, c_float, c_int, c_int, c_int], c_char_p)( text, c_float(sum_rate), sum_len, sentence_count, html_tag_remove )
[docs] @NLPIRBase.byte_str_transform def single_doc_e( self, text: str, sum_rate: float = 0.0, sum_len: int = 500, html_tag_remove: int = 0, sentence_count: int = 0 ): """ Call **DS_SingleDocE** 生成单文档摘要该函数支持多线程,是多线程安全的, make summarization with threading safe :param str text: 文档内容 text content :param float sum_rate: 文档摘要占原文百分比(为0.00则不限制) the percentage of summarization length comparing to original text (0.00 represent no limit) :param int sum_len: 用户限定的摘要长度(为0则不限制)The max len of summarization(0 will no limit) :param bool html_tag_remove: 是否需要对原文进行Html标签的去除 remove the html tag or not :param int sentence_count: 用户限定的句子数量 (为0则不限制) :return: 摘要字符串;出错返回空串 the summarization content, get null string if occurs error. """ buffer_len = int(len(text) * 3 * (sum_rate if sum_rate > 0.0 else 1)) buffer_len = sum_len if sum_len < buffer_len else buffer_len result = create_string_buffer(buffer_len * 4) result_2 = self.get_func("DS_SingleDocE", [c_char_p, c_char_p, c_float, c_int, c_int])( result, text, c_float(sum_rate), sum_len, sentence_count, html_tag_remove ) return result.value, result_2
[docs] @NLPIRBase.byte_str_transform def file_process( self, text_filename: str, sum_rate: float = 0.0, sum_len: int = 500, html_tag_remove: int = 0, sentence_count: int = 0 ): """ Call **DS_FileProcess** 生成单文档摘要该函数支持多线程,是多线程安全的, make summarization from file with threading safe :param str text_filename: 文档文件路径 text file path :param float sum_rate: 文档摘要占原文百分比(为0.00则不限制) the percentage of summarization length comparing to original text (0.00 represent no limit) :param int sum_len: 用户限定的摘要长度(为0则不限制)The max len of summarization(0 will no limit) :param bool html_tag_remove: 是否需要对原文进行Html标签的去除 remove the html tag or not :param int sentence_count: 用户限定的句子数量 (为0则不限制) :return: 摘要字符串;出错返回空串 the summarization content, get null string if occurs error. """ return self.get_func("DS_FileProcess", [c_char_p, c_float, c_int, c_int], c_char_p)( text_filename, c_float(sum_rate), sum_len, sentence_count, html_tag_remove)