Question

Я использую пакет cloudml для R в сочетании с пакетом tfestimators для создания и развертывания классификатора DNN с использованием Tensorflow, чтобы я мог использовать его для прогнозирования двоичного файла.ответ (столбец «Ответ» ниже).

Я успешно прошел развертывание моей модели в Google Cloud ML Engine.Это было нелегко.

Я застрял на последней части головоломки - получении прогнозов от моей облачной модели.В частности, мне нужна помощь в структурировании моих данных для аргумента «instance» функции «cloudml_predict». Это - единственная документация по пакету с примером, который я нашел в Интернете для пользователей useR, но я не считаю его применимым к моей ситуации.

Пример набора данных:

library(dplyr)

my_data <- data_frame(
    Response = sample(c("Y", "N"), 1000, replace = TRUE),
    Col1 = sample(c("A", "B"), 1000, replace = TRUE),
    Col2 = sample(c("Happy", "Sad"), 1000, replace = TRUE),
    Col3 = sample(1:100, 1000, replace = TRUE),
    col4 = sample(500:1000, 1000, replace = TRUE),
    Col5 = runif(1000, 0, 1)
)

Это мой сценарий "train.R":

library(tfestimators)
library(caret)        # for even partitioning of dataset

# Create feature columns ----
    FLAGS <- flags(
        flag_numeric("num_epochs", 100)
    )

numeric_cols <- colnames(my_data)[unlist(lapply(my_data, is.numeric))]

cols <- feature_columns(
    column_numeric(numeric_cols),
    column_indicator(
        column_categorical_with_vocabulary_list(
            "Col1",
            vocabulary_list = unique(my_data$Col1),
            dtype = tf$string
        )
    ),
    column_indicator(
        column_categorical_with_vocabulary_list(
            "Col2",
            vocabulary_list = unique(my_data$Col2),
            dtype = tf$string
        )
    ),
    column_indicator(
        column_crossed(
            keys = c("Col1", "Col2"),
            hash_bucket_size = 20L
        )
    )
)



# Split the data into training & test sets ----
set.seed(3456)

inTrain <- createDataPartition(my_data$Response,
                               p = 0.8,
                               list = FALSE,
                               times = 1)

training <- my_data[inTrain, ]
testing  <- my_data[-inTrain, ]

#' Now we need to create an input function with the listing of input and output
#' variables.

pred_fn <- function(data, num_epochs = 10) {
    input_fn(data,
             features = setdiff(names(data), "Response"),
             response = "Response",
             num_epochs = num_epochs)
}

#' Build a deep learning classifier
#' We will create 3 hidden layers, with 80, 40 and 30 nodes, respectively

classifier <- dnn_classifier(
    feature_columns = cols,
    hidden_units = c(80, 40, 30),
    n_classes = 2L,
    label_vocabulary = c("N", "Y"),
    model_dir = "./tmp",
    activation_fn = "relu"
)

classifier %>% tfestimators::train(input_fn = pred_fn(training, num_epochs = FLAGS$num_epochs))
classifier %>% tfestimators::evaluate(input_fn = pred_fn(testing))
classifier %>% predict(input_fn = pred_fn(testing))

#' Help on serving_input_receiver_fn:
#' https://rdrr.io/github/rstudio/tfdeploy/src/tests/testthat/models/tfestimators-example.R
tfestimators::export_savedmodel(classifier,
                                export_dir_base = "savedmodel1",
                                serving_input_receiver_fn = tf$estimator$export$build_parsing_serving_input_receiver_fn(
                                    classifier_parse_example_spec(
                                        feature_columns = cols,
                                        weight_column = NULL,
                                        label_key = "label"
                                    )),
                                as_text = FALSE)

Сценарий развертывания:

library(cloudml)

# Train ----
job <- cloudml_train("train.R")

# Find directory of exported trained model
latest_run()$run_dir

# Deploy the model
# Use result from latest_run()$run_dir to populate file path here
cloudml_deploy("runs/cloudml_2018_10_08_113833889/savedmodel1", name = "test_model")


# Prediction (where I need help) ----

instances <- list()
instances[["instances"]] <- list()
instances$instances[["inputs"]] <- apply(testing[1:1, -1], 1, as.list)

cloudml_predict(name = "test_model",
                version = "test_model_1",
                instances = instances,
                verbose = TRUE)

Самое близкое, что я получил, это следующее сообщение об ошибке:

Error in cloudml_predict(name = "test_model", version = "test_model_1",  : 
  Prediction failed: Error processing input: Expected string, got...

Использование функции прогнозирования в пакете cloudml R

Пожалуйста, войдите или зарегистрируйтесь чтобы ответить на этот вопрос.

Ответы [ 0 ]

Использование функции прогнозирования в пакете cloudml R

Пожалуйста, войдите или зарегистрируйтесь чтобы ответить на этот вопрос.

Ответы [ 0 ]

Похожие темы