sdks/python/apache_beam/typehints/schemas.py - beam - Git at Google

 #
 # Licensed to the Apache Software Foundation (ASF) under one or more
 # contributor license agreements.  See the NOTICE file distributed with
 # this work for additional information regarding copyright ownership.
 # The ASF licenses this file to You under the Apache License, Version 2.0
 # (the "License"); you may not use this file except in compliance with
 # the License.  You may obtain a copy of the License at
 #
 #    http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #

 """ Support for mapping python types to proto Schemas and back again.

 Imposes a mapping between common Python types and Beam portable schemas
 (https://s.apache.org/beam-schemas)::

   Python              Schema
   np.int8     <-----> BYTE
   np.int16    <-----> INT16
   np.int32    <-----> INT32
   np.int64    <-----> INT64
   int         ------> INT64
   np.float32  <-----> FLOAT
   np.float64  <-----> DOUBLE
   float       ------> DOUBLE
   bool        <-----> BOOLEAN
   str/unicode <-----> STRING
   bytes       <-----> BYTES
   ByteString  ------> BYTES
   Timestamp   <-----> LogicalType(urn="beam:logical_type:micros_instant:v1")
   Mapping     <-----> MapType
   Sequence    <-----> ArrayType
   NamedTuple  <-----> RowType
   beam.Row    ------> RowType

 Note that some of these mappings are provided as conveniences,
 but they are lossy and will not survive a roundtrip from python to Beam schemas
 and back. For example, the Python type :code:`int` will map to :code:`INT64` in
 Beam schemas but converting that back to a Python type will yield
 :code:`np.int64`.

 :code:`nullable=True` on a Beam :code:`FieldType` is represented in Python by
 wrapping the type in :code:`Optional`.
 """

 # pytype: skip-file

 from __future__ import absolute_import

 from typing import Any
 from typing import ByteString
 from typing import Generic
 from typing import Mapping
 from typing import NamedTuple
 from typing import Optional
 from typing import Sequence
 from typing import TypeVar
 from uuid import uuid4

 import numpy as np
 from past.builtins import unicode

 from apache_beam.portability.api import schema_pb2
 from apache_beam.typehints import row_type
 from apache_beam.typehints.native_type_compatibility import _get_args
 from apache_beam.typehints.native_type_compatibility import _match_is_exactly_mapping
 from apache_beam.typehints.native_type_compatibility import _match_is_optional
 from apache_beam.typehints.native_type_compatibility import _safe_issubclass
 from apache_beam.typehints.native_type_compatibility import extract_optional_type
 from apache_beam.typehints.native_type_compatibility import match_is_named_tuple
 from apache_beam.utils import proto_utils
 from apache_beam.utils.timestamp import Timestamp

 PYTHON_ANY_URN = "beam:logical:pythonsdk_any:v1"


 # Registry of typings for a schema by UUID
 class SchemaTypeRegistry(object):
   def __init__(self):
     self.by_id = {}
     self.by_typing = {}

   def add(self, typing, schema):
     self.by_id[schema.id] = (typing, schema)

   def get_typing_by_id(self, unique_id):
     result = self.by_id.get(unique_id, None)
     return result[0] if result is not None else None

   def get_schema_by_id(self, unique_id):
     result = self.by_id.get(unique_id, None)
     return result[1] if result is not None else None


 SCHEMA_REGISTRY = SchemaTypeRegistry()

 # Bi-directional mappings
 _PRIMITIVES = (
     (np.int8, schema_pb2.BYTE),
     (np.int16, schema_pb2.INT16),
     (np.int32, schema_pb2.INT32),
     (np.int64, schema_pb2.INT64),
     (np.float32, schema_pb2.FLOAT),
     (np.float64, schema_pb2.DOUBLE),
     (unicode, schema_pb2.STRING),
     (bool, schema_pb2.BOOLEAN),
     (bytes, schema_pb2.BYTES),
 )

 PRIMITIVE_TO_ATOMIC_TYPE = dict((typ, atomic) for typ, atomic in _PRIMITIVES)
 ATOMIC_TYPE_TO_PRIMITIVE = dict((atomic, typ) for typ, atomic in _PRIMITIVES)

 # One-way mappings
 PRIMITIVE_TO_ATOMIC_TYPE.update({
     ByteString: schema_pb2.BYTES,
     # Allow users to specify a native int, and use INT64 as the cross-language
     # representation. Technically ints have unlimited precision, but RowCoder
     # should throw an error if it sees one with a bit width > 64 when encoding.
     int: schema_pb2.INT64,
     float: schema_pb2.DOUBLE,
 })

 # Name of the attribute added to user types (existing and generated) to store
 # the corresponding schema ID
 _BEAM_SCHEMA_ID = "_beam_schema_id"


 def named_fields_to_schema(names_and_types):
   # type: (Sequence[Tuple[str, type]]) -> schema_pb2.Schema
   return schema_pb2.Schema(
       fields=[
           schema_pb2.Field(name=name, type=typing_to_runner_api(type))
           for (name, type) in names_and_types
       ],
       id=str(uuid4()))


 def named_fields_from_schema(
     schema):  # (schema_pb2.Schema) -> typing.List[typing.Tuple[unicode, type]]
   return [(field.name, typing_from_runner_api(field.type))
           for field in schema.fields]


 def typing_to_runner_api(type_):
   if match_is_named_tuple(type_):
     schema = None
     if hasattr(type_, _BEAM_SCHEMA_ID):
       schema = SCHEMA_REGISTRY.get_schema_by_id(getattr(type_, _BEAM_SCHEMA_ID))
     if schema is None:
       fields = [
           schema_pb2.Field(
               name=name, type=typing_to_runner_api(type_._field_types[name]))
           for name in type_._fields
       ]
       type_id = str(uuid4())
       schema = schema_pb2.Schema(fields=fields, id=type_id)
       setattr(type_, _BEAM_SCHEMA_ID, type_id)
       SCHEMA_REGISTRY.add(type_, schema)

     return schema_pb2.FieldType(row_type=schema_pb2.RowType(schema=schema))

   # All concrete types (other than NamedTuple sub-classes) should map to
   # a supported primitive type.
   elif type_ in PRIMITIVE_TO_ATOMIC_TYPE:
     return schema_pb2.FieldType(atomic_type=PRIMITIVE_TO_ATOMIC_TYPE[type_])

   elif _match_is_exactly_mapping(type_):
     key_type, value_type = map(typing_to_runner_api, _get_args(type_))
     return schema_pb2.FieldType(
         map_type=schema_pb2.MapType(key_type=key_type, value_type=value_type))

   elif _match_is_optional(type_):
     # It's possible that a user passes us Optional[Optional[T]], but in python
     # typing this is indistinguishable from Optional[T] - both resolve to
     # Union[T, None] - so there's no need to check for that case here.
     result = typing_to_runner_api(extract_optional_type(type_))
     result.nullable = True
     return result

   elif _safe_issubclass(type_, Sequence):
     element_type = typing_to_runner_api(_get_args(type_)[0])
     return schema_pb2.FieldType(
         array_type=schema_pb2.ArrayType(element_type=element_type))

   elif _safe_issubclass(type_, Mapping):
     key_type, value_type = map(typing_to_runner_api, _get_args(type_))
     return schema_pb2.FieldType(
         map_type=schema_pb2.MapType(key_type=key_type, value_type=value_type))

   try:
     logical_type = LogicalType.from_typing(type_)
   except ValueError:
     # Unknown type, just treat it like Any
     return schema_pb2.FieldType(
         logical_type=schema_pb2.LogicalType(urn=PYTHON_ANY_URN))
   else:
     # TODO(bhulette): Add support for logical types that require arguments
     return schema_pb2.FieldType(
         logical_type=schema_pb2.LogicalType(
             urn=logical_type.urn(),
             representation=typing_to_runner_api(
                 logical_type.representation_type())))


 def typing_from_runner_api(fieldtype_proto):
   if fieldtype_proto.nullable:
     # In order to determine the inner type, create a copy of fieldtype_proto
     # with nullable=False and pass back to typing_from_runner_api
     base_type = schema_pb2.FieldType()
     base_type.CopyFrom(fieldtype_proto)
     base_type.nullable = False
     return Optional[typing_from_runner_api(base_type)]

   type_info = fieldtype_proto.WhichOneof("type_info")
   if type_info == "atomic_type":
     try:
       return ATOMIC_TYPE_TO_PRIMITIVE[fieldtype_proto.atomic_type]
     except KeyError:
       raise ValueError(
           "Unsupported atomic type: {0}".format(fieldtype_proto.atomic_type))
   elif type_info == "array_type":
     return Sequence[typing_from_runner_api(
         fieldtype_proto.array_type.element_type)]
   elif type_info == "map_type":
     return Mapping[typing_from_runner_api(fieldtype_proto.map_type.key_type),
                    typing_from_runner_api(fieldtype_proto.map_type.value_type)]
   elif type_info == "row_type":
     schema = fieldtype_proto.row_type.schema
     user_type = SCHEMA_REGISTRY.get_typing_by_id(schema.id)
     if user_type is None:
       from apache_beam import coders

       type_name = 'BeamSchema_{}'.format(schema.id.replace('-', '_'))
       user_type = NamedTuple(
           type_name,
           [(field.name, typing_from_runner_api(field.type))
            for field in schema.fields])

       setattr(user_type, _BEAM_SCHEMA_ID, schema.id)

       # Define a reduce function, otherwise these types can't be pickled
       # (See BEAM-9574)
       def __reduce__(self):
         return (
             _hydrate_namedtuple_instance,
             (schema.SerializeToString(), tuple(self)))

       setattr(user_type, '__reduce__', __reduce__)

       SCHEMA_REGISTRY.add(user_type, schema)
       coders.registry.register_coder(user_type, coders.RowCoder)
     return user_type

   elif type_info == "logical_type":
     if fieldtype_proto.logical_type.urn == PYTHON_ANY_URN:
       return Any
     else:
       return LogicalType.from_runner_api(
           fieldtype_proto.logical_type).language_type()


 def _hydrate_namedtuple_instance(encoded_schema, values):
   return named_tuple_from_schema(
       proto_utils.parse_Bytes(encoded_schema, schema_pb2.Schema))(*values)


 def named_tuple_from_schema(schema):
   return typing_from_runner_api(
       schema_pb2.FieldType(row_type=schema_pb2.RowType(schema=schema)))


 def named_tuple_to_schema(named_tuple):
   return typing_to_runner_api(named_tuple).row_type.schema


 def schema_from_element_type(element_type):  # (type) -> schema_pb2.Schema
   """Get a schema for the given PCollection element_type.

   Returns schema as a list of (name, python_type) tuples"""
   if isinstance(element_type, row_type.RowTypeConstraint):
     # TODO(BEAM-10722): Make sure beam.Row generated schemas are registered and
     # de-duped
     return named_fields_to_schema(element_type._fields)
   elif match_is_named_tuple(element_type):
     return named_tuple_to_schema(element_type)
   else:
     raise TypeError(
         "Attempted to determine schema for unsupported type '%s'" %
         element_type)


 def named_fields_from_element_type(
     element_type):  # (type) -> typing.List[typing.Tuple[unicode, type]]
   return named_fields_from_schema(schema_from_element_type(element_type))


 # Registry of typings for a schema by UUID
 class LogicalTypeRegistry(object):
   def __init__(self):
     self.by_urn = {}
     self.by_logical_type = {}
     self.by_language_type = {}

   def add(self, urn, logical_type):
     self.by_urn[urn] = logical_type
     self.by_logical_type[logical_type] = urn
     self.by_language_type[logical_type.language_type()] = logical_type

   def get_logical_type_by_urn(self, urn):
     return self.by_urn.get(urn, None)

   def get_urn_by_logial_type(self, logical_type):
     return self.by_logical_type.get(logical_type, None)

   def get_logical_type_by_language_type(self, representation_type):
     return self.by_language_type.get(representation_type, None)


 LanguageT = TypeVar('LanguageT')
 RepresentationT = TypeVar('RepresentationT')
 ArgT = TypeVar('ArgT')


 class LogicalType(Generic[LanguageT, RepresentationT, ArgT]):
   _known_logical_types = LogicalTypeRegistry()

   @classmethod
   def urn(cls):
     # type: () -> unicode

     """Return the URN used to identify this logical type"""
     raise NotImplementedError()

   @classmethod
   def language_type(cls):
     # type: () -> type

     """Return the language type this LogicalType encodes.

     The returned type should match LanguageT"""
     raise NotImplementedError()

   @classmethod
   def representation_type(cls):
     # type: () -> type

     """Return the type of the representation this LogicalType uses to encode the
     language type.

     The returned type should match RepresentationT"""
     raise NotImplementedError()

   @classmethod
   def argument_type(cls):
     # type: () -> type

     """Return the type of the argument used for variations of this LogicalType.

     The returned type should match ArgT"""
     raise NotImplementedError(cls)

   def argument(self):
     # type: () -> ArgT

     """Return the argument for this instance of the LogicalType."""
     raise NotImplementedError()

   def to_representation_type(value):
     # type: (LanguageT) -> RepresentationT

     """Convert an instance of LanguageT to RepresentationT."""
     raise NotImplementedError()

   def to_language_type(value):
     # type: (RepresentationT) -> LanguageT

     """Convert an instance of RepresentationT to LanguageT."""
     raise NotImplementedError()

   @classmethod
   def register_logical_type(cls, logical_type_cls):
     """Register an implementation of LogicalType."""
     cls._known_logical_types.add(logical_type_cls.urn(), logical_type_cls)

   @classmethod
   def from_typing(cls, typ):
     # type: (type) -> LogicalType

     """Construct an instance of a registered LogicalType implementation given a
     typing.

     Raises ValueError if no registered LogicalType implementation can encode the
     given typing."""

     logical_type = cls._known_logical_types.get_logical_type_by_language_type(
         typ)
     if logical_type is None:
       raise ValueError("No logical type registered for typing '%s'" % typ)

     return logical_type._from_typing(typ)

   @classmethod
   def _from_typing(cls, typ):
     # type: (type) -> LogicalType

     """Construct an instance of this LogicalType implementation given a typing.
     """
     raise NotImplementedError()

   @classmethod
   def from_runner_api(cls, logical_type_proto):
     # type: (schema_pb2.LogicalType) -> LogicalType

     """Construct an instance of a registered LogicalType implementation given a
     proto LogicalType.

     Raises ValueError if no LogicalType registered for the given URN.
     """
     logical_type = cls._known_logical_types.get_logical_type_by_urn(
         logical_type_proto.urn)
     if logical_type is None:
       raise ValueError(
           "No logical type registered for URN '%s'" % logical_type_proto.urn)
     # TODO(bhulette): Use argument
     return logical_type()


 class NoArgumentLogicalType(LogicalType[LanguageT, RepresentationT, None]):
   @classmethod
   def argument_type(cls):
     # type: () -> type
     return None

   def argument(self):
     # type: () -> ArgT
     return None

   @classmethod
   def _from_typing(cls, typ):
     # type: (type) -> LogicalType

     # Since there's no argument, there can be no additional information encoded
     # in the typing. Just construct an instance.
     return cls()


 MicrosInstantRepresentation = NamedTuple(
     'MicrosInstantRepresentation', [('seconds', np.int64),
                                     ('micros', np.int64)])


 @LogicalType.register_logical_type
 class MicrosInstant(NoArgumentLogicalType[Timestamp,
                                           MicrosInstantRepresentation]):
   @classmethod
   def urn(cls):
     return "beam:logical_type:micros_instant:v1"

   @classmethod
   def representation_type(cls):
     # type: () -> type
     return MicrosInstantRepresentation

   @classmethod
   def language_type(cls):
     return Timestamp

   def to_representation_type(self, value):
     # type: (Timestamp) -> MicrosInstantRepresentation
     return MicrosInstantRepresentation(
         value.micros // 1000000, value.micros % 1000000)

   def to_language_type(self, value):
     # type: (MicrosInstantRepresentation) -> Timestamp
     return Timestamp(seconds=int(value.seconds), micros=int(value.micros))
	#
	# Licensed to the Apache Software Foundation (ASF) under one or more
	# contributor license agreements. See the NOTICE file distributed with
	# this work for additional information regarding copyright ownership.
	# The ASF licenses this file to You under the Apache License, Version 2.0
	# (the "License"); you may not use this file except in compliance with
	# the License. You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.
	#

	""" Support for mapping python types to proto Schemas and back again.

	Imposes a mapping between common Python types and Beam portable schemas
	(https://s.apache.org/beam-schemas)::

	Python Schema
	np.int8 <-----> BYTE
	np.int16 <-----> INT16
	np.int32 <-----> INT32
	np.int64 <-----> INT64
	int ------> INT64
	np.float32 <-----> FLOAT
	np.float64 <-----> DOUBLE
	float ------> DOUBLE
	bool <-----> BOOLEAN
	str/unicode <-----> STRING
	bytes <-----> BYTES
	ByteString ------> BYTES
	Timestamp <-----> LogicalType(urn="beam:logical_type:micros_instant:v1")
	Mapping <-----> MapType
	Sequence <-----> ArrayType
	NamedTuple <-----> RowType
	beam.Row ------> RowType

	Note that some of these mappings are provided as conveniences,
	but they are lossy and will not survive a roundtrip from python to Beam schemas
	and back. For example, the Python type :code:`int` will map to :code:`INT64` in
	Beam schemas but converting that back to a Python type will yield
	:code:`np.int64`.

	:code:`nullable=True` on a Beam :code:`FieldType` is represented in Python by
	wrapping the type in :code:`Optional`.
	"""

	# pytype: skip-file

	from __future__ import absolute_import

	from typing import Any
	from typing import ByteString
	from typing import Generic
	from typing import Mapping
	from typing import NamedTuple
	from typing import Optional
	from typing import Sequence
	from typing import TypeVar
	from uuid import uuid4

	import numpy as np
	from past.builtins import unicode

	from apache_beam.portability.api import schema_pb2
	from apache_beam.typehints import row_type
	from apache_beam.typehints.native_type_compatibility import _get_args
	from apache_beam.typehints.native_type_compatibility import _match_is_exactly_mapping
	from apache_beam.typehints.native_type_compatibility import _match_is_optional
	from apache_beam.typehints.native_type_compatibility import _safe_issubclass
	from apache_beam.typehints.native_type_compatibility import extract_optional_type
	from apache_beam.typehints.native_type_compatibility import match_is_named_tuple
	from apache_beam.utils import proto_utils
	from apache_beam.utils.timestamp import Timestamp

	PYTHON_ANY_URN = "beam:logical:pythonsdk_any:v1"


	# Registry of typings for a schema by UUID
	class SchemaTypeRegistry(object):
	def __init__(self):
	self.by_id = {}
	self.by_typing = {}

	def add(self, typing, schema):
	self.by_id[schema.id] = (typing, schema)

	def get_typing_by_id(self, unique_id):
	result = self.by_id.get(unique_id, None)
	return result[0] if result is not None else None

	def get_schema_by_id(self, unique_id):
	result = self.by_id.get(unique_id, None)
	return result[1] if result is not None else None


	SCHEMA_REGISTRY = SchemaTypeRegistry()

	# Bi-directional mappings
	_PRIMITIVES = (
	(np.int8, schema_pb2.BYTE),
	(np.int16, schema_pb2.INT16),
	(np.int32, schema_pb2.INT32),
	(np.int64, schema_pb2.INT64),
	(np.float32, schema_pb2.FLOAT),
	(np.float64, schema_pb2.DOUBLE),
	(unicode, schema_pb2.STRING),
	(bool, schema_pb2.BOOLEAN),
	(bytes, schema_pb2.BYTES),
	)

	PRIMITIVE_TO_ATOMIC_TYPE = dict((typ, atomic) for typ, atomic in _PRIMITIVES)
	ATOMIC_TYPE_TO_PRIMITIVE = dict((atomic, typ) for typ, atomic in _PRIMITIVES)

	# One-way mappings
	PRIMITIVE_TO_ATOMIC_TYPE.update({
	ByteString: schema_pb2.BYTES,
	# Allow users to specify a native int, and use INT64 as the cross-language
	# representation. Technically ints have unlimited precision, but RowCoder
	# should throw an error if it sees one with a bit width > 64 when encoding.
	int: schema_pb2.INT64,
	float: schema_pb2.DOUBLE,
	})

	# Name of the attribute added to user types (existing and generated) to store
	# the corresponding schema ID
	_BEAM_SCHEMA_ID = "_beam_schema_id"


	def named_fields_to_schema(names_and_types):
	# type: (Sequence[Tuple[str, type]]) -> schema_pb2.Schema
	return schema_pb2.Schema(
	fields=[
	schema_pb2.Field(name=name, type=typing_to_runner_api(type))
	for (name, type) in names_and_types
	],
	id=str(uuid4()))


	def named_fields_from_schema(
	schema): # (schema_pb2.Schema) -> typing.List[typing.Tuple[unicode, type]]
	return [(field.name, typing_from_runner_api(field.type))
	for field in schema.fields]


	def typing_to_runner_api(type_):
	if match_is_named_tuple(type_):
	schema = None
	if hasattr(type_, _BEAM_SCHEMA_ID):
	schema = SCHEMA_REGISTRY.get_schema_by_id(getattr(type_, _BEAM_SCHEMA_ID))
	if schema is None:
	fields = [
	schema_pb2.Field(
	name=name, type=typing_to_runner_api(type_._field_types[name]))
	for name in type_._fields
	]
	type_id = str(uuid4())
	schema = schema_pb2.Schema(fields=fields, id=type_id)
	setattr(type_, _BEAM_SCHEMA_ID, type_id)
	SCHEMA_REGISTRY.add(type_, schema)

	return schema_pb2.FieldType(row_type=schema_pb2.RowType(schema=schema))

	# All concrete types (other than NamedTuple sub-classes) should map to
	# a supported primitive type.
	elif type_ in PRIMITIVE_TO_ATOMIC_TYPE:
	return schema_pb2.FieldType(atomic_type=PRIMITIVE_TO_ATOMIC_TYPE[type_])

	elif _match_is_exactly_mapping(type_):
	key_type, value_type = map(typing_to_runner_api, _get_args(type_))
	return schema_pb2.FieldType(
	map_type=schema_pb2.MapType(key_type=key_type, value_type=value_type))

	elif _match_is_optional(type_):
	# It's possible that a user passes us Optional[Optional[T]], but in python
	# typing this is indistinguishable from Optional[T] - both resolve to
	# Union[T, None] - so there's no need to check for that case here.
	result = typing_to_runner_api(extract_optional_type(type_))
	result.nullable = True
	return result

	elif _safe_issubclass(type_, Sequence):
	element_type = typing_to_runner_api(_get_args(type_)[0])
	return schema_pb2.FieldType(
	array_type=schema_pb2.ArrayType(element_type=element_type))

	elif _safe_issubclass(type_, Mapping):
	key_type, value_type = map(typing_to_runner_api, _get_args(type_))
	return schema_pb2.FieldType(
	map_type=schema_pb2.MapType(key_type=key_type, value_type=value_type))

	try:
	logical_type = LogicalType.from_typing(type_)
	except ValueError:
	# Unknown type, just treat it like Any
	return schema_pb2.FieldType(
	logical_type=schema_pb2.LogicalType(urn=PYTHON_ANY_URN))
	else:
	# TODO(bhulette): Add support for logical types that require arguments
	return schema_pb2.FieldType(
	logical_type=schema_pb2.LogicalType(
	urn=logical_type.urn(),
	representation=typing_to_runner_api(
	logical_type.representation_type())))


	def typing_from_runner_api(fieldtype_proto):
	if fieldtype_proto.nullable:
	# In order to determine the inner type, create a copy of fieldtype_proto
	# with nullable=False and pass back to typing_from_runner_api
	base_type = schema_pb2.FieldType()
	base_type.CopyFrom(fieldtype_proto)
	base_type.nullable = False
	return Optional[typing_from_runner_api(base_type)]

	type_info = fieldtype_proto.WhichOneof("type_info")
	if type_info == "atomic_type":
	try:
	return ATOMIC_TYPE_TO_PRIMITIVE[fieldtype_proto.atomic_type]
	except KeyError:
	raise ValueError(
	"Unsupported atomic type: {0}".format(fieldtype_proto.atomic_type))
	elif type_info == "array_type":
	return Sequence[typing_from_runner_api(
	fieldtype_proto.array_type.element_type)]
	elif type_info == "map_type":
	return Mapping[typing_from_runner_api(fieldtype_proto.map_type.key_type),
	typing_from_runner_api(fieldtype_proto.map_type.value_type)]
	elif type_info == "row_type":
	schema = fieldtype_proto.row_type.schema
	user_type = SCHEMA_REGISTRY.get_typing_by_id(schema.id)
	if user_type is None:
	from apache_beam import coders

	type_name = 'BeamSchema_{}'.format(schema.id.replace('-', '_'))
	user_type = NamedTuple(
	type_name,
	[(field.name, typing_from_runner_api(field.type))
	for field in schema.fields])

	setattr(user_type, _BEAM_SCHEMA_ID, schema.id)

	# Define a reduce function, otherwise these types can't be pickled
	# (See BEAM-9574)
	def __reduce__(self):
	return (
	_hydrate_namedtuple_instance,
	(schema.SerializeToString(), tuple(self)))

	setattr(user_type, '__reduce__', __reduce__)

	SCHEMA_REGISTRY.add(user_type, schema)
	coders.registry.register_coder(user_type, coders.RowCoder)
	return user_type

	elif type_info == "logical_type":
	if fieldtype_proto.logical_type.urn == PYTHON_ANY_URN:
	return Any
	else:
	return LogicalType.from_runner_api(
	fieldtype_proto.logical_type).language_type()


	def _hydrate_namedtuple_instance(encoded_schema, values):
	return named_tuple_from_schema(
	proto_utils.parse_Bytes(encoded_schema, schema_pb2.Schema))(*values)


	def named_tuple_from_schema(schema):
	return typing_from_runner_api(
	schema_pb2.FieldType(row_type=schema_pb2.RowType(schema=schema)))


	def named_tuple_to_schema(named_tuple):
	return typing_to_runner_api(named_tuple).row_type.schema


	def schema_from_element_type(element_type): # (type) -> schema_pb2.Schema
	"""Get a schema for the given PCollection element_type.

	Returns schema as a list of (name, python_type) tuples"""
	if isinstance(element_type, row_type.RowTypeConstraint):
	# TODO(BEAM-10722): Make sure beam.Row generated schemas are registered and
	# de-duped
	return named_fields_to_schema(element_type._fields)
	elif match_is_named_tuple(element_type):
	return named_tuple_to_schema(element_type)
	else:
	raise TypeError(
	"Attempted to determine schema for unsupported type '%s'" %
	element_type)


	def named_fields_from_element_type(
	element_type): # (type) -> typing.List[typing.Tuple[unicode, type]]
	return named_fields_from_schema(schema_from_element_type(element_type))


	# Registry of typings for a schema by UUID
	class LogicalTypeRegistry(object):
	def __init__(self):
	self.by_urn = {}
	self.by_logical_type = {}
	self.by_language_type = {}

	def add(self, urn, logical_type):
	self.by_urn[urn] = logical_type
	self.by_logical_type[logical_type] = urn
	self.by_language_type[logical_type.language_type()] = logical_type

	def get_logical_type_by_urn(self, urn):
	return self.by_urn.get(urn, None)

	def get_urn_by_logial_type(self, logical_type):
	return self.by_logical_type.get(logical_type, None)

	def get_logical_type_by_language_type(self, representation_type):
	return self.by_language_type.get(representation_type, None)


	LanguageT = TypeVar('LanguageT')
	RepresentationT = TypeVar('RepresentationT')
	ArgT = TypeVar('ArgT')


	class LogicalType(Generic[LanguageT, RepresentationT, ArgT]):
	_known_logical_types = LogicalTypeRegistry()

	@classmethod
	def urn(cls):
	# type: () -> unicode

	"""Return the URN used to identify this logical type"""
	raise NotImplementedError()

	@classmethod
	def language_type(cls):
	# type: () -> type

	"""Return the language type this LogicalType encodes.

	The returned type should match LanguageT"""
	raise NotImplementedError()

	@classmethod
	def representation_type(cls):
	# type: () -> type

	"""Return the type of the representation this LogicalType uses to encode the
	language type.

	The returned type should match RepresentationT"""
	raise NotImplementedError()

	@classmethod
	def argument_type(cls):
	# type: () -> type

	"""Return the type of the argument used for variations of this LogicalType.

	The returned type should match ArgT"""
	raise NotImplementedError(cls)

	def argument(self):
	# type: () -> ArgT

	"""Return the argument for this instance of the LogicalType."""
	raise NotImplementedError()

	def to_representation_type(value):
	# type: (LanguageT) -> RepresentationT

	"""Convert an instance of LanguageT to RepresentationT."""
	raise NotImplementedError()

	def to_language_type(value):
	# type: (RepresentationT) -> LanguageT

	"""Convert an instance of RepresentationT to LanguageT."""
	raise NotImplementedError()

	@classmethod
	def register_logical_type(cls, logical_type_cls):
	"""Register an implementation of LogicalType."""
	cls._known_logical_types.add(logical_type_cls.urn(), logical_type_cls)

	@classmethod
	def from_typing(cls, typ):
	# type: (type) -> LogicalType

	"""Construct an instance of a registered LogicalType implementation given a
	typing.

	Raises ValueError if no registered LogicalType implementation can encode the
	given typing."""

	logical_type = cls._known_logical_types.get_logical_type_by_language_type(
	typ)
	if logical_type is None:
	raise ValueError("No logical type registered for typing '%s'" % typ)

	return logical_type._from_typing(typ)

	@classmethod
	def _from_typing(cls, typ):
	# type: (type) -> LogicalType

	"""Construct an instance of this LogicalType implementation given a typing.
	"""
	raise NotImplementedError()

	@classmethod
	def from_runner_api(cls, logical_type_proto):
	# type: (schema_pb2.LogicalType) -> LogicalType

	"""Construct an instance of a registered LogicalType implementation given a
	proto LogicalType.

	Raises ValueError if no LogicalType registered for the given URN.
	"""
	logical_type = cls._known_logical_types.get_logical_type_by_urn(
	logical_type_proto.urn)
	if logical_type is None:
	raise ValueError(
	"No logical type registered for URN '%s'" % logical_type_proto.urn)
	# TODO(bhulette): Use argument
	return logical_type()


	class NoArgumentLogicalType(LogicalType[LanguageT, RepresentationT, None]):
	@classmethod
	def argument_type(cls):
	# type: () -> type
	return None

	def argument(self):
	# type: () -> ArgT
	return None

	@classmethod
	def _from_typing(cls, typ):
	# type: (type) -> LogicalType

	# Since there's no argument, there can be no additional information encoded
	# in the typing. Just construct an instance.
	return cls()


	MicrosInstantRepresentation = NamedTuple(
	'MicrosInstantRepresentation', [('seconds', np.int64),
	('micros', np.int64)])


	@LogicalType.register_logical_type
	class MicrosInstant(NoArgumentLogicalType[Timestamp,
	MicrosInstantRepresentation]):
	@classmethod
	def urn(cls):
	return "beam:logical_type:micros_instant:v1"

	@classmethod
	def representation_type(cls):
	# type: () -> type
	return MicrosInstantRepresentation

	@classmethod
	def language_type(cls):
	return Timestamp

	def to_representation_type(self, value):
	# type: (Timestamp) -> MicrosInstantRepresentation
	return MicrosInstantRepresentation(
	value.micros // 1000000, value.micros % 1000000)

	def to_language_type(self, value):
	# type: (MicrosInstantRepresentation) -> Timestamp
	return Timestamp(seconds=int(value.seconds), micros=int(value.micros))