-
Notifications
You must be signed in to change notification settings - Fork 14
/
Copy pathload.py
35 lines (24 loc) · 895 Bytes
/
load.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# -*- coding: utf-8 -*-
import numpy as np
import cPickle
import random
def atisfold():
f = open('data/data_set.pkl')
train_set, test_set, dicts = cPickle.load(f)
embedding = cPickle.load(open('data/embedding.pkl'))
return train_set, test_set,dicts,embedding
def pad_sentences(sentences, padding_word=0, forced_sequence_length=None):
if forced_sequence_length is None:
sequence_length=max(len(x) for x in sentences)
else:
sequence_length=forced_sequence_length
padded_sentences=[]
for i in xrange(len(sentences)):
sentence=sentences[i]
num_padding=sequence_length-len(sentence)
if num_padding<0:
padded_sentence=sentence[0:sequence_length]
else:
padded_sentence=sentence+[int(padding_word)]*num_padding
padded_sentences.append(padded_sentence)
return padded_sentences