/* Copyright 2016 The TensorFlow Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. ==============================================================================*/ // A set of lightweight wrappers which simplify access to Feature protos. // // TensorFlow Example proto uses associative maps on top of oneof fields. // SequenceExample proto uses associative map of FeatureList. // So accessing feature values is not very convenient. // // For example, to read a first value of integer feature "tag": // int id = example.features().feature().at("tag").int64_list().value(0) // // to add a value: // auto features = example->mutable_features(); // (*features->mutable_feature())["tag"].mutable_int64_list()->add_value(id) // // For float features you have to use float_list, for string - bytes_list. // // To do the same with this library: // int id = GetFeatureValues("tag", example).Get(0); // GetFeatureValues("tag", &example)->Add(id); // // Modification of bytes features is slightly different: // auto tag = GetFeatureValues("tag", &example); // *tag->Add() = "lorem ipsum"; // // To copy multiple values into a feature: // AppendFeatureValues({1,2,3}, "tag", &example); // // GetFeatureValues gives you access to underlying data - RepeatedField object // (RepeatedPtrField for byte list). So refer to its documentation of // RepeatedField for full list of supported methods. // // NOTE: Due to the nature of oneof proto fields setting a feature of one type // automatically clears all values stored as another type with the same feature // key. // // This library also has tools to work with SequenceExample protos. // // To get a value from SequenceExample.context: // int id = GetFeatureValues("tag", se.context()).Get(0); // To add a value to the context: // GetFeatureValues("tag", se.mutable_context())->Add(42); // // To add values to feature_lists: // AppendFeatureValues({4.0}, // GetFeatureList("images", &se)->Add()); // AppendFeatureValues({5.0, 3.0}, // GetFeatureList("images", &se)->Add()); // This will create a feature list keyed as "images" with two features: // feature_lists { // feature_list { // key: "images" // value { // feature { float_list { value: [4.0] } } // feature { float_list { value: [5.0, 3.0] } } // } // } } // // Functions exposed by this library: // HasFeature<[FeatureType]>(key, proto) -> bool // Returns true if a feature with the specified key, and optionally // FeatureType, belongs to the Features or Example proto. // HasFeatureList(key, sequence_example) -> bool // Returns true if SequenceExample has a feature_list with the key. // GetFeatureValues(key, proto) -> RepeatedField // Returns values for the specified key and the FeatureType. // Supported types for the proto: Example, Features. // GetFeatureList(key, sequence_example) -> RepeatedPtrField // Returns Feature protos associated with a key. // AppendFeatureValues(begin, end, feature) // AppendFeatureValues(container or initializer_list, feature) // Copies values into a Feature. // AppendFeatureValues(begin, end, key, proto) // AppendFeatureValues(container or initializer_list, key, proto) // Copies values into Features and Example protos with the specified key. // // Auxiliary functions, it is unlikely you'll need to use them directly: // GetFeatures(proto) -> Features // A convenience function to get Features proto. // Supported types for the proto: Example, Features. // GetFeature(key, proto) -> Feature* // Returns a Feature proto for the specified key, creates a new if // necessary. Supported types for the proto: Example, Features. // GetFeatureValues(feature) -> RepeatedField // Returns values of the feature for the FeatureType. #ifndef TENSORFLOW_CORE_EXAMPLE_FEATURE_UTIL_H_ #define TENSORFLOW_CORE_EXAMPLE_FEATURE_UTIL_H_ #include #include #include "absl/base/macros.h" #include "tensorflow/core/example/example.pb.h" #include "tensorflow/core/example/feature.pb.h" #include "tensorflow/core/lib/core/stringpiece.h" #include "tensorflow/core/platform/protobuf.h" #include "tensorflow/core/platform/types.h" namespace tensorflow { namespace internal { // TODO(gorban): Update all clients in a followup CL. // Returns a reference to a feature corresponding to the name. // Note: it will create a new Feature if it is missing in the example. ABSL_DEPRECATED("Use GetFeature instead.") Feature& ExampleFeature(const string& name, Example* example); // Specializations of RepeatedFieldTrait define a type of RepeatedField // corresponding to a selected feature type. template struct RepeatedFieldTrait; template <> struct RepeatedFieldTrait { using Type = protobuf::RepeatedField; }; template <> struct RepeatedFieldTrait { using Type = protobuf::RepeatedField; }; template <> struct RepeatedFieldTrait { using Type = protobuf::RepeatedPtrField; }; // Specializations of FeatureTrait define a type of feature corresponding to a // selected value type. template struct FeatureTrait; template struct FeatureTrait::value>::type> { using Type = protobuf_int64; }; template struct FeatureTrait< ValueType, typename std::enable_if::value>::type> { using Type = float; }; template struct is_string : public std::integral_constant< bool, std::is_same::type>::value || std::is_same::type>::value> { }; template <> struct is_string : std::true_type {}; template <> struct is_string<::tensorflow::StringPiece> : std::true_type {}; template struct FeatureTrait< ValueType, typename std::enable_if::value>::type> { using Type = string; }; } // namespace internal // Returns true if sequence_example has a feature_list with the specified key. bool HasFeatureList(const string& key, const SequenceExample& sequence_example); template struct TypeHasFeatures : std::false_type {}; template <> struct TypeHasFeatures : std::true_type {}; template <> struct TypeHasFeatures : std::true_type {}; // A family of template functions to return mutable Features proto from a // container proto. Supported ProtoTypes: Example, Features. template typename std::enable_if::value, Features*>::type GetFeatures(ProtoType* proto); template typename std::enable_if::value, const Features&>::type GetFeatures(const ProtoType& proto); // Base declaration of a family of template functions to return a read only // repeated field of feature values. template const typename internal::RepeatedFieldTrait::Type& GetFeatureValues(const Feature& feature); // Returns a read only repeated field corresponding to a feature with the // specified name and FeatureType. Supported ProtoTypes: Example, Features. template const typename internal::RepeatedFieldTrait::Type& GetFeatureValues(const string& key, const ProtoType& proto) { return GetFeatureValues(GetFeatures(proto).feature().at(key)); } // Returns a mutable repeated field of a feature values. template typename internal::RepeatedFieldTrait::Type* GetFeatureValues( Feature* feature); // Returns a mutable repeated field corresponding to a feature with the // specified name and FeatureType. Supported ProtoTypes: Example, Features. template typename internal::RepeatedFieldTrait::Type* GetFeatureValues( const string& key, ProtoType* proto) { ::tensorflow::Feature& feature = (*GetFeatures(proto)->mutable_feature())[key]; return GetFeatureValues(&feature); } // Returns a Feature proto for the specified key, creates a new if necessary. // Supported types for the proto: Example, Features. template Feature* GetFeature(const string& key, ProtoType* proto) { return &(*GetFeatures(proto)->mutable_feature())[key]; } // Returns a repeated field with features corresponding to a feature_list key. const protobuf::RepeatedPtrField& GetFeatureList( const string& key, const SequenceExample& sequence_example); // Returns a mutable repeated field with features corresponding to a // feature_list key. It will create a new FeatureList if necessary. protobuf::RepeatedPtrField* GetFeatureList( const string& feature_list_key, SequenceExample* sequence_example); template void AppendFeatureValues(IteratorType first, IteratorType last, Feature* feature) { using FeatureType = typename internal::FeatureTrait< typename std::iterator_traits::value_type>::Type; std::copy(first, last, protobuf::RepeatedFieldBackInserter( GetFeatureValues(feature))); } template void AppendFeatureValues(std::initializer_list container, Feature* feature) { AppendFeatureValues(container.begin(), container.end(), feature); } template void AppendFeatureValues(const ContainerType& container, Feature* feature) { using IteratorType = typename ContainerType::const_iterator; AppendFeatureValues(container.begin(), container.end(), feature); } // Copies elements from the range, defined by [first, last) into the feature // obtainable from the (proto, key) combination. template void AppendFeatureValues(IteratorType first, IteratorType last, const string& key, ProtoType* proto) { AppendFeatureValues(first, last, GetFeature(key, GetFeatures(proto))); } // Copies all elements from the container into a feature. template void AppendFeatureValues(const ContainerType& container, const string& key, ProtoType* proto) { using IteratorType = typename ContainerType::const_iterator; AppendFeatureValues(container.begin(), container.end(), key, proto); } // Copies all elements from the initializer list into a Feature contained by // Features or Example proto. template void AppendFeatureValues(std::initializer_list container, const string& key, ProtoType* proto) { using IteratorType = typename std::initializer_list::const_iterator; AppendFeatureValues(container.begin(), container.end(), key, proto); } // Returns true if a feature with the specified key belongs to the Features. // The template parameter pack accepts zero or one template argument - which // is FeatureType. If the FeatureType not specified (zero template arguments) // the function will not check the feature type. Otherwise it will return false // if the feature has a wrong type. template bool HasFeature(const string& key, const Features& features); // Returns true if a feature with the specified key belongs to the Example. // Doesn't check feature type if used without FeatureType, otherwise the // specialized versions return false if the feature has a wrong type. template bool HasFeature(const string& key, const Example& example) { return HasFeature(key, GetFeatures(example)); } // TODO(gorban): update all clients in a followup CL. template ABSL_DEPRECATED("Use HasFeature instead.") bool ExampleHasFeature(const string& key, const Example& example) { return HasFeature(key, example); } } // namespace tensorflow #endif // TENSORFLOW_CORE_EXAMPLE_FEATURE_UTIL_H_