2023-09-27 16:06:32 +08:00
|
|
|
from fields.dataset_fields import dataset_fields
|
2024-01-12 12:34:01 +08:00
|
|
|
from flask_restful import fields
|
2023-09-27 16:06:32 +08:00
|
|
|
from libs.helper import TimestampField
|
|
|
|
|
|
|
|
document_fields = {
|
|
|
|
'id': fields.String,
|
|
|
|
'position': fields.Integer,
|
|
|
|
'data_source_type': fields.String,
|
|
|
|
'data_source_info': fields.Raw(attribute='data_source_info_dict'),
|
|
|
|
'dataset_process_rule_id': fields.String,
|
|
|
|
'name': fields.String,
|
|
|
|
'created_from': fields.String,
|
|
|
|
'created_by': fields.String,
|
|
|
|
'created_at': TimestampField,
|
|
|
|
'tokens': fields.Integer,
|
|
|
|
'indexing_status': fields.String,
|
|
|
|
'error': fields.String,
|
|
|
|
'enabled': fields.Boolean,
|
|
|
|
'disabled_at': TimestampField,
|
|
|
|
'disabled_by': fields.String,
|
|
|
|
'archived': fields.Boolean,
|
|
|
|
'display_status': fields.String,
|
|
|
|
'word_count': fields.Integer,
|
|
|
|
'hit_count': fields.Integer,
|
|
|
|
'doc_form': fields.String,
|
|
|
|
}
|
|
|
|
|
|
|
|
document_with_segments_fields = {
|
|
|
|
'id': fields.String,
|
|
|
|
'position': fields.Integer,
|
|
|
|
'data_source_type': fields.String,
|
|
|
|
'data_source_info': fields.Raw(attribute='data_source_info_dict'),
|
|
|
|
'dataset_process_rule_id': fields.String,
|
|
|
|
'name': fields.String,
|
|
|
|
'created_from': fields.String,
|
|
|
|
'created_by': fields.String,
|
|
|
|
'created_at': TimestampField,
|
|
|
|
'tokens': fields.Integer,
|
|
|
|
'indexing_status': fields.String,
|
|
|
|
'error': fields.String,
|
|
|
|
'enabled': fields.Boolean,
|
|
|
|
'disabled_at': TimestampField,
|
|
|
|
'disabled_by': fields.String,
|
|
|
|
'archived': fields.Boolean,
|
|
|
|
'display_status': fields.String,
|
|
|
|
'word_count': fields.Integer,
|
|
|
|
'hit_count': fields.Integer,
|
|
|
|
'completed_segments': fields.Integer,
|
|
|
|
'total_segments': fields.Integer
|
|
|
|
}
|
|
|
|
|
|
|
|
dataset_and_document_fields = {
|
|
|
|
'dataset': fields.Nested(dataset_fields),
|
|
|
|
'documents': fields.List(fields.Nested(document_fields)),
|
|
|
|
'batch': fields.String
|
|
|
|
}
|
|
|
|
|
|
|
|
document_status_fields = {
|
|
|
|
'id': fields.String,
|
|
|
|
'indexing_status': fields.String,
|
|
|
|
'processing_started_at': TimestampField,
|
|
|
|
'parsing_completed_at': TimestampField,
|
|
|
|
'cleaning_completed_at': TimestampField,
|
|
|
|
'splitting_completed_at': TimestampField,
|
|
|
|
'completed_at': TimestampField,
|
|
|
|
'paused_at': TimestampField,
|
|
|
|
'error': fields.String,
|
|
|
|
'stopped_at': TimestampField,
|
|
|
|
'completed_segments': fields.Integer,
|
|
|
|
'total_segments': fields.Integer,
|
|
|
|
}
|
|
|
|
|
|
|
|
document_status_fields_list = {
|
|
|
|
'data': fields.List(fields.Nested(document_status_fields))
|
|
|
|
}
|