Skip to content
This repository has been archived by the owner on May 9, 2024. It is now read-only.

Latest commit

 

History

History
50 lines (48 loc) · 1.25 KB

aihub_patent2.md

File metadata and controls

50 lines (48 loc) · 1.25 KB

AIHub Patent Section Summary

Sample

# Dataset card: identity, provenance, and size statistics for one corpus.

# --- Identity and provenance ---
# Short identifier; the data/meta file names listed in this card start with it.
name: aihub_patent2
fullname: AIHub Patent Section Summary
# Language code of the corpus (presumably ISO 639-1 "ko" = Korean; confirm).
lang: ko
category: paper
# Korean text; roughly "AIHub / paper-material summarization / patent section
# only".
description: AIHub/논문자료 요약/특허섹션만
license: Attribution-NonCommercial (CC-By-NC v3)
homepage: https://aihub.or.kr
# Three-part version; parses as a string (not a float) because of the two dots.
version: 1.0.0

# --- Corpus statistics ---
# num_docs is 3326 lower than num_docs_before_processing.
num_docs: 147674
num_docs_before_processing: 151000
# Exactly 2 x num_docs (295348 = 2 * 147674).
num_segments: 295348
num_sents: 1879909
num_words: 46045036
# NOTE(review): the "before processing" byte count uses a different key prefix
# (num_bytes_*) than the current size (size_in_bytes); presumably both measure
# the same thing at different pipeline stages -- confirm.
size_in_bytes: 479383377
num_bytes_before_processing: 489562944
# Human-readable form of size_in_bytes (479383377 / 2^20 ~= 457.18).
size_in_human_bytes: 457.18 MiB

# --- Timestamps ---
# Quoted so they load as plain strings rather than YAML timestamps.
# No timezone is given in the values.
data_files_modified: '2022-02-21 10:29:24'
meta_files_modified: '2022-02-21 10:26:34'
info_updated: '2022-02-26 03:06:08'
# Parquet file for each split (train / test).
# NOTE(review): bare file names with no directory component; presumably
# resolved relative to the dataset's storage location -- confirm.
data_files:
  train: aihub_patent2-train.parquet
  test: aihub_patent2-test.parquet
# Per-split metadata files; each name is the matching data file name with a
# "meta-" prefix.
meta_files:
  train: meta-aihub_patent2-train.parquet
  test: meta-aihub_patent2-test.parquet
# Schema description for the files referenced by this card.
features:
  # NOTE(review): presumably maps a logical role (key) to the actual column
  # name (value); here both are identical -- confirm against the loader.
  columns:
    id: id
    text: text
  # Column name -> type name. Presumably describes the data_files parquet
  # columns -- confirm.
  data:
    id: int
    text: str
  # Column name -> type name. Presumably describes the meta_files parquet
  # columns; `id` appears in both `data` and `meta`, so it is likely the join
  # key -- confirm.
  meta:
    id: int
    split: str
    doc_type: str
    doc_id: str
    title: str
    date: str
    # Presumably the patent registration number -- confirm.
    reg_no: str
    # Presumably the International Patent Classification code -- confirm.
    ipc: str