Added small dataset
This commit is contained in:
parent
3f465991f0
commit
d1ff88da82
BIN
Assets/Dataset/1-hop/curated/corpus.txt
(Stored with Git LFS)
Normal file
BIN
Assets/Dataset/1-hop/curated/corpus.txt
(Stored with Git LFS)
Normal file
Binary file not shown.
BIN
Assets/Dataset/1-hop/small/corpus.txt
(Stored with Git LFS)
Normal file
BIN
Assets/Dataset/1-hop/small/corpus.txt
(Stored with Git LFS)
Normal file
Binary file not shown.
BIN
Assets/Dataset/1-hop/small/rdf_completation.csv
(Stored with Git LFS)
Normal file
BIN
Assets/Dataset/1-hop/small/rdf_completation.csv
(Stored with Git LFS)
Normal file
Binary file not shown.
|
BIN
Assets/Dataset/1-hop/small/rdf_text.csv
(Stored with Git LFS)
Normal file
BIN
Assets/Dataset/1-hop/small/rdf_text.csv
(Stored with Git LFS)
Normal file
Binary file not shown.
|
@ -45,9 +45,8 @@ def normalize_sequence(
|
|||||||
pad_token: int,
|
pad_token: int,
|
||||||
end_token: int,
|
end_token: int,
|
||||||
) -> tuple[list[int], list[bool]]:
|
) -> tuple[list[int], list[bool]]:
|
||||||
|
new_sequence = truncate_sequence(sequence, max_length, end_token)
|
||||||
new_sequence = pad_sequence(sequence, max_length, pad_token)
|
new_sequence = pad_sequence(new_sequence, max_length, pad_token)
|
||||||
new_sequence = truncate_sequence(new_sequence, max_length, end_token)
|
|
||||||
PADDING_MASK = create_padding_mask(new_sequence, pad_token)
|
PADDING_MASK = create_padding_mask(new_sequence, pad_token)
|
||||||
|
|
||||||
return (new_sequence, PADDING_MASK)
|
return (new_sequence, PADDING_MASK)
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user