example/gluon/lipnet/utils/align.py - mxnet - Git at Google

 # Licensed to the Apache Software Foundation (ASF) under one
 # or more contributor license agreements.  See the NOTICE file
 # distributed with this work for additional information
 # regarding copyright ownership.  The ASF licenses this file
 # to you under the Apache License, Version 2.0 (the
 # "License"); you may not use this file except in compliance
 # with the License.  You may obtain a copy of the License at
 #
 #   http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 # KIND, either express or implied.  See the License for the
 # specific language governing permissions and limitations
 # under the License.

 """
 Module: align
 This is used when the data is genrated by LipsDataset
 """

 import numpy as np
 from .common import word_to_vector


 class Align(object):
     """
     Preprocess for Align
     """
     skip_list = ['sil', 'sp']

     def __init__(self, align_path):
         self.build(align_path)

     def build(self, align_path):
         """
         Build the align array
         """
         file = open(align_path, 'r')
         lines = file.readlines()
         file.close()
         # words: list([op, ed, word])
         words = []
         for line in lines:
             _op, _ed, word = line.strip().split(' ')
             if word not in Align.skip_list:
                 words.append((int(_op), int(_ed), word))
         self.words = words
         self.n_words = len(words)
         self.sentence_str = " ".join([w[2] for w in self.words])
         self.sentence_length = len(self.sentence_str)

     def sentence(self, padding=75):
         """
         Get sentence
         """
         vec = word_to_vector(self.sentence_str)
         vec += [-1] * (padding - self.sentence_length)
         return np.array(vec, dtype=np.int32)

     def word(self, _id, padding=75):
         """
         Get words
         """
         word = self.words[_id][2]
         vec = word_to_vector(word)
         vec += [-1] * (padding - len(vec))
         return np.array(vec, dtype=np.int32)

     def word_length(self, _id):
         """
         Get the length of words
         """
         return len(self.words[_id][2])

     def word_frame_pos(self, _id):
         """
         Get the position of words
         """
         left = int(self.words[_id][0]/1000)
         right = max(left+1, int(self.words[_id][1]/1000))
         return (left, right)
	# Licensed to the Apache Software Foundation (ASF) under one
	# or more contributor license agreements. See the NOTICE file
	# distributed with this work for additional information
	# regarding copyright ownership. The ASF licenses this file
	# to you under the Apache License, Version 2.0 (the
	# "License"); you may not use this file except in compliance
	# with the License. You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing,
	# software distributed under the License is distributed on an
	# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	# KIND, either express or implied. See the License for the
	# specific language governing permissions and limitations
	# under the License.

	"""
	Module: align
	This is used when the data is genrated by LipsDataset
	"""

	import numpy as np
	from .common import word_to_vector


	class Align(object):
	"""
	Preprocess for Align
	"""
	skip_list = ['sil', 'sp']

	def __init__(self, align_path):
	self.build(align_path)

	def build(self, align_path):
	"""
	Build the align array
	"""
	file = open(align_path, 'r')
	lines = file.readlines()
	file.close()
	# words: list([op, ed, word])
	words = []
	for line in lines:
	_op, _ed, word = line.strip().split(' ')
	if word not in Align.skip_list:
	words.append((int(_op), int(_ed), word))
	self.words = words
	self.n_words = len(words)
	self.sentence_str = " ".join([w[2] for w in self.words])
	self.sentence_length = len(self.sentence_str)

	def sentence(self, padding=75):
	"""
	Get sentence
	"""
	vec = word_to_vector(self.sentence_str)
	vec += [-1] * (padding - self.sentence_length)
	return np.array(vec, dtype=np.int32)

	def word(self, _id, padding=75):
	"""
	Get words
	"""
	word = self.words[_id][2]
	vec = word_to_vector(word)
	vec += [-1] * (padding - len(vec))
	return np.array(vec, dtype=np.int32)

	def word_length(self, _id):
	"""
	Get the length of words
	"""
	return len(self.words[_id][2])

	def word_frame_pos(self, _id):
	"""
	Get the position of words
	"""
	left = int(self.words[_id][0]/1000)
	right = max(left+1, int(self.words[_id][1]/1000))
	return (left, right)