CSV表格行作为前几行的标签

问题描述

我有一个关于TensorFlow的问题。我有一份CSV数据(如附图所示),想对它做如下映射:绿色的行是其前面5行的标签。是否可以在map函数(Dataset.map())中完成这个操作?应该如何实现?


解决方案

可以尝试使用 tf.data.Dataset.window:

import tensorflow as tf
import pandas as pd

# Toy table: eight columns 'A'..'H', each holding the integers 1..12, so that
# row i (1-based) consists of eight copies of i.
d = {column: list(range(1, 13)) for column in 'ABCDEFGH'}

df = pd.DataFrame(d)

def redefine_data(windowed_ds, num_inputs=5):
  """Convert a dataset of windows into a dataset of (data, label) pairs.

  Every element of `windowed_ds` is itself an iterable dataset of rows. The
  first `num_inputs` rows of a window are packed into a single data tensor
  and the row immediately after them is used as the label for that window.

  Args:
    windowed_ds: dataset whose elements are windows (nested datasets), e.g.
      the result of `tf.data.Dataset.window`. Each window must contain at
      least `num_inputs + 1` rows; otherwise fetching the label raises
      `StopIteration`.
    num_inputs: number of leading rows of each window that form the data.
      Defaults to 5, the value that used to be hard-coded.

  Returns:
    A `tf.data.Dataset` built with `from_tensor_slices` that yields one
    `(data, label)` tuple per window.
  """
  data, labels = [], []
  # The windows are iterated in Python, so all pairs are materialized in
  # memory before the resulting dataset is created.
  for window in windowed_ds:
    # Leading rows of the window -> one tensor with a row per input step.
    data.append(tf.convert_to_tensor(list(window.take(num_inputs))))
    # The row right after the inputs is the label.
    labels.append(next(iter(window.skip(num_inputs).take(1))))
  return tf.data.Dataset.from_tensor_slices((data, labels))

# Slide a 6-row window (5 data rows + 1 label row) over the table, starting a
# new window every 3 rows and discarding a trailing window that is incomplete,
# then turn each window into a (data, label) pair.
ds = redefine_data(
    tf.data.Dataset.from_tensor_slices(df.values).window(
        6, shift=3, stride=1, drop_remainder=True
    )
)

# Show every (data, label) pair that was produced.
for data, label in ds:
  print(data, label)
tf.Tensor(
[[1 1 1 1 1 1 1 1]
 [2 2 2 2 2 2 2 2]
 [3 3 3 3 3 3 3 3]
 [4 4 4 4 4 4 4 4]
 [5 5 5 5 5 5 5 5]], shape=(5, 8), dtype=int64) tf.Tensor([6 6 6 6 6 6 6 6], shape=(8,), dtype=int64)
tf.Tensor(
[[4 4 4 4 4 4 4 4]
 [5 5 5 5 5 5 5 5]
 [6 6 6 6 6 6 6 6]
 [7 7 7 7 7 7 7 7]
 [8 8 8 8 8 8 8 8]], shape=(5, 8), dtype=int64) tf.Tensor([9 9 9 9 9 9 9 9], shape=(8,), dtype=int64)
tf.Tensor(
[[ 7  7  7  7  7  7  7  7]
 [ 8  8  8  8  8  8  8  8]
 [ 9  9  9  9  9  9  9  9]
 [10 10 10 10 10 10 10 10]
 [11 11 11 11 11 11 11 11]], shape=(5, 8), dtype=int64) tf.Tensor([12 12 12 12 12 12 12 12], shape=(8,), dtype=int64)

相关文章