Skip to content
This repository has been archived by the owner on May 9, 2024. It is now read-only.

Latest commit

 

History

History
51 lines (49 loc) · 1.32 KB

aihub_koen_sci.md

File metadata and controls

51 lines (49 loc) · 1.32 KB

AiHub Translation - Science Field

Sample

# Dataset card for the AIHub Korean-to-English translation corpus
# (science field).

# Identity and provenance.
name: aihub_koen_sci
fullname: AiHub Translation - Science Field
lang: ko
category: translation
description: AIHub Korean to English Translation Corpus - Science Field
license: Attribution-NonCommercial (CC-By-NC v3)
homepage: https://aihub.or.kr
version: 1.0.0

# Corpus statistics. Document, segment, and sentence counts are all
# identical in this card.
num_docs: 1344631
num_docs_before_processing: 1344631
num_segments: 1344631
num_sents: 1344631
num_words: 17720448

# On-disk size. 172404050 bytes / 1024^2 is approximately 164.42 MiB.
size_in_bytes: 172404050
num_bytes_before_processing: 172422911
size_in_human_bytes: 164.42 MiB

# Timestamps are quoted so YAML loaders keep them as plain strings
# instead of converting them to native datetime values.
data_files_modified: '2022-02-14 12:25:30'
meta_files_modified: '2022-01-29 09:34:28'
info_updated: '2022-02-26 03:06:08'

# Parquet file for each split.
data_files:
  train: aihub_koen_sci-train.parquet
  test: aihub_koen_sci-test.parquet

# Metadata parquet file for each split.
meta_files:
  train: meta-aihub_koen_sci-train.parquet
  test: meta-aihub_koen_sci-test.parquet

features:
  # Column-name mapping for the data files.
  columns:
    id: id
    text: text
  # Value type of each data column.
  data:
    id: int
    text: str
  # Value type of each metadata column.
  meta:
    id: int
    sn: str
    file_name: str
    # Uses the same `str` type name as the other string fields.
    data_set: str
    domain: str
    subdomain: str
    source: str
    style: str
    # NOTE(review): presumably the English side of the translation
    # pair - confirm against the metadata files.
    english: str