Project: 2021-1-capstone-design2 / 2015104209
Commit 15541aeb42e26c6b14e22f45d1e5d4e42dfea6e6 (1 parent: c115738b)
Authored by 이현규, 2021-05-20 00:50:01 +0900

Add kaggle solution maker

Showing 1 changed file with 448 additions and 0 deletions

esot3ria/inference_kaggle_solution.py (new file, mode 100644)
# Copyright 2017 Google Inc. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS-IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Binary for generating predictions over a set of videos."""

from __future__ import print_function

import glob
import heapq
import json
import os
import tarfile
import tempfile
import time

import numpy as np
import readers
from six.moves import urllib
import tensorflow as tf
from tensorflow import app
from tensorflow import flags
from tensorflow import gfile
from tensorflow import logging
from tensorflow.python.lib.io import file_io
import utils
from collections import Counter
import operator
FLAGS = flags.FLAGS

if __name__ == "__main__":
  # Input
  flags.DEFINE_string(
      "train_dir", "./new_model",
      "The directory to load the model files from. We assume "
      "that you have already run eval.py onto this, such that "
      "inference_model.* files already exist.")
  flags.DEFINE_string(
      "input_data_pattern",
      "/Volumes/HDD/develop/yt8m/3/frame/test/test*.tfrecord",
      "File glob defining the evaluation dataset in tensorflow.SequenceExample "
      "format. The SequenceExamples are expected to have an 'rgb' byte array "
      "sequence feature as well as a 'labels' int64 context feature.")
  flags.DEFINE_string(
      "input_model_tgz", "",
      "If given, must be path to a .tgz file that was written "
      "by this binary using flag --output_model_tgz. In this "
      "case, the .tgz file will be untarred to "
      "--untar_model_dir and the model will be used for "
      "inference.")
  flags.DEFINE_string(
      "untar_model_dir", "/tmp/yt8m-model",
      "If --input_model_tgz is given, then this directory will "
      "be created and the contents of the .tgz file will be "
      "untarred here.")
  flags.DEFINE_bool(
      "segment_labels", True,
      "If set, then --input_data_pattern must be frame-level features (but with"
      " segment_labels). Otherwise, --input_data_pattern must be aggregated "
      "video-level features. The model must also be set appropriately (i.e. to "
      "read 3D batches VS 4D batches).")
  flags.DEFINE_integer("segment_max_pred", 100000,
                       "Limit total number of segment outputs per entity.")
  flags.DEFINE_string(
      "segment_label_ids_file",
      "https://raw.githubusercontent.com/google/youtube-8m/master/segment_label_ids.csv",
      "The file that contains the segment label ids.")

  # Output
  flags.DEFINE_string("output_file", "/Users/esot3ria/kaggle_solution.csv",
                      "The file to save the predictions to.")
  flags.DEFINE_string(
      "output_model_tgz", "",
      "If given, should be a filename with a .tgz extension, "
      "the model graph and checkpoint will be bundled in this "
      "gzip tar. This file can be uploaded to Kaggle for the "
      "top 10 participants.")
  flags.DEFINE_integer("top_k", 5, "How many predictions to output per video.")

  # Other flags.
  flags.DEFINE_integer("batch_size", 512,
                       "How many examples to process per batch.")
  flags.DEFINE_integer("num_readers", 1,
                       "How many threads to use for reading input files.")
def format_lines(video_ids, predictions, top_k, whitelisted_cls_mask=None):
  """Create an information line for the submission file."""
  batch_size = len(video_ids)
  for video_index in range(batch_size):
    video_prediction = predictions[video_index]
    if whitelisted_cls_mask is not None:
      # Whitelist classes.
      video_prediction *= whitelisted_cls_mask
    top_indices = np.argpartition(video_prediction, -top_k)[-top_k:]
    line = [(class_index, predictions[video_index][class_index])
            for class_index in top_indices]
    line = sorted(line, key=lambda p: -p[1])
    yield (video_ids[video_index] + "," +
           " ".join("%i %g" % (label, score) for (label, score) in line) +
           "\n").encode("utf8")
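
# A minimal sketch (editor's illustration, not part of the commit) of what
# format_lines yields: "<video_id>,<label> <score> ..." per example, encoded
# as UTF-8 bytes. The names dummy_ids/dummy_preds are made up:
#
#   dummy_ids = ["vid01"]
#   dummy_preds = np.array([[0.1, 0.9, 0.3, 0.7]])
#   for line in format_lines(dummy_ids, dummy_preds, top_k=2):
#     print(line)  # b'vid01,1 0.9 3 0.7\n'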
def get_input_data_tensors(reader, data_pattern, batch_size, num_readers=1):
  """Creates the section of the graph which reads the input data.

  Args:
    reader: A class which parses the input data.
    data_pattern: A 'glob' style path to the data files.
    batch_size: How many examples to process at a time.
    num_readers: How many I/O threads to use.

  Returns:
    A tuple containing the features tensor, labels tensor, and optionally a
    tensor containing the number of frames per video. The exact dimensions
    depend on the reader being used.

  Raises:
    IOError: If no files matching the given pattern were found.
  """
  with tf.name_scope("input"):
    files = gfile.Glob(data_pattern)
    if not files:
      raise IOError("Unable to find input files. data_pattern='" +
                    data_pattern + "'")
    logging.info("number of input files: " + str(len(files)))
    filename_queue = tf.train.string_input_producer(files,
                                                    num_epochs=1,
                                                    shuffle=False)
    examples_and_labels = [
        reader.prepare_reader(filename_queue) for _ in range(num_readers)
    ]

    input_data_dict = (tf.train.batch_join(examples_and_labels,
                                           batch_size=batch_size,
                                           allow_smaller_final_batch=True,
                                           enqueue_many=True))
    video_id_batch = input_data_dict["video_ids"]
    video_batch = input_data_dict["video_matrix"]
    num_frames_batch = input_data_dict["num_frames"]
    return video_id_batch, video_batch, num_frames_batch
def get_segments(batch_video_mtx, batch_num_frames, segment_size):
  """Get segment-level inputs from frame-level features."""
  video_batch_size = batch_video_mtx.shape[0]
  max_frame = batch_video_mtx.shape[1]
  feature_dim = batch_video_mtx.shape[-1]
  padded_segment_sizes = (batch_num_frames + segment_size - 1) // segment_size
  padded_segment_sizes *= segment_size
  segment_mask = (
      0 < (padded_segment_sizes[:, np.newaxis] - np.arange(0, max_frame)))

  # Segment bags.
  frame_bags = batch_video_mtx.reshape((-1, feature_dim))
  segment_frames = frame_bags[segment_mask.reshape(-1)].reshape(
      (-1, segment_size, feature_dim))

  # Segment num frames.
  segment_start_times = np.arange(0, max_frame, segment_size)
  num_segments = batch_num_frames[:, np.newaxis] - segment_start_times
  num_segment_bags = num_segments.reshape((-1))
  valid_segment_mask = num_segment_bags > 0
  segment_num_frames = num_segment_bags[valid_segment_mask]
  segment_num_frames[segment_num_frames > segment_size] = segment_size

  max_segment_num = (max_frame + segment_size - 1) // segment_size
  video_idxs = np.tile(
      np.arange(0, video_batch_size)[:, np.newaxis], [1, max_segment_num])
  segment_idxs = np.tile(segment_start_times, [video_batch_size, 1])
  idx_bags = np.stack([video_idxs, segment_idxs], axis=-1).reshape((-1, 2))
  video_segment_ids = idx_bags[valid_segment_mask]

  return {
      "video_batch": segment_frames,
      "num_frames_batch": segment_num_frames,
      "video_segment_ids": video_segment_ids
  }
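
# Editor's sanity check (illustration only; assumes the padded frame axis is a
# multiple of segment_size, as with YT8M's 300-frame inputs, otherwise the
# reshape above fails). Two videos padded to 10 frames with 3-dim features;
# video 0 has 7 valid frames (2 segments), video 1 has 3 (1 segment):
#
#   demo_mtx = np.zeros((2, 10, 3), dtype=np.float32)
#   demo_out = get_segments(demo_mtx, np.array([7, 3]), 5)
#   demo_out["video_batch"].shape   # (3, 5, 3)
#   demo_out["num_frames_batch"]    # array([5, 2, 3])
#   demo_out["video_segment_ids"]   # array([[0, 0], [0, 5], [1, 0]])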
def normalize_tag(tag):
  if isinstance(tag, str):
    # NOTE: str.replace matches literally, so the pattern '[^a-zA-Z]' is never
    # found and this call is a no-op; a regex via re.sub was presumably
    # intended.
    new_tag = tag.lower().replace('[^a-zA-Z]', ' ')
    # Strip a trailing parenthetical, e.g. "video game (industry)".
    if new_tag.find(" (") != -1:
      new_tag = new_tag[:new_tag.find(" (")]
    # Join words with hyphens.
    new_tag = new_tag.replace(" ", "-")
    return new_tag
  else:
    return tag
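
# Editor's illustration (not part of the commit): with the code as written,
# only the parenthetical-stripping and hyphenation steps take effect:
#
#   normalize_tag("Video game (industry)")  # -> "video-game"
#   normalize_tag(1234)                     # -> 1234 (non-str passes through)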
def inference(reader, train_dir, data_pattern, out_file_location, batch_size,
              top_k):
  """Inference function."""
  with tf.Session(config=tf.ConfigProto(
      allow_soft_placement=True)) as sess, gfile.Open(out_file_location,
                                                      "w+") as out_file:
    video_id_batch, video_batch, num_frames_batch = get_input_data_tensors(
        reader, data_pattern, batch_size)
    inference_model_name = "segment_inference_model" if FLAGS.segment_labels \
        else "inference_model"
    checkpoint_file = os.path.join(train_dir, "inference_model",
                                   inference_model_name)
    if not gfile.Exists(checkpoint_file + ".meta"):
      raise IOError("Cannot find %s. Did you run eval.py?" % checkpoint_file)
    meta_graph_location = checkpoint_file + ".meta"
    logging.info("loading meta-graph: " + meta_graph_location)

    if FLAGS.output_model_tgz:
      with tarfile.open(FLAGS.output_model_tgz, "w:gz") as tar:
        for model_file in glob.glob(checkpoint_file + ".*"):
          tar.add(model_file, arcname=os.path.basename(model_file))
        tar.add(os.path.join(train_dir, "model_flags.json"),
                arcname="model_flags.json")
      print("Tarred model onto " + FLAGS.output_model_tgz)
    with tf.device("/cpu:0"):
      saver = tf.train.import_meta_graph(meta_graph_location,
                                         clear_devices=True)
    logging.info("restoring variables from " + checkpoint_file)
    saver.restore(sess, checkpoint_file)
    input_tensor = tf.get_collection("input_batch_raw")[0]
    num_frames_tensor = tf.get_collection("num_frames")[0]
    predictions_tensor = tf.get_collection("predictions")[0]

    # Workaround for num_epochs issue.
    def set_up_init_ops(variables):
      init_op_list = []
      for variable in list(variables):
        if "train_input" in variable.name:
          init_op_list.append(tf.assign(variable, 1))
          variables.remove(variable)
      init_op_list.append(tf.variables_initializer(variables))
      return init_op_list

    sess.run(
        set_up_init_ops(tf.get_collection_ref(tf.GraphKeys.LOCAL_VARIABLES)))

    coord = tf.train.Coordinator()
    threads = tf.train.start_queue_runners(sess=sess, coord=coord)
    num_examples_processed = 0
    start_time = time.time()
    whitelisted_cls_mask = None
    if FLAGS.segment_labels:
      final_out_file = out_file
      out_file = tempfile.NamedTemporaryFile()
      logging.info(
          "Segment temp prediction output will be written to temp file: %s",
          out_file.name)
      if FLAGS.segment_label_ids_file:
        whitelisted_cls_mask = np.zeros((predictions_tensor.get_shape()[-1],),
                                        dtype=np.float32)
        segment_label_ids_file = FLAGS.segment_label_ids_file
        if segment_label_ids_file.startswith("http"):
          logging.info("Retrieving segment ID whitelist files from %s...",
                       segment_label_ids_file)
          segment_label_ids_file, _ = urllib.request.urlretrieve(
              segment_label_ids_file)
        with tf.io.gfile.GFile(segment_label_ids_file) as fobj:
          for line in fobj:
            try:
              cls_id = int(line)
              whitelisted_cls_mask[cls_id] = 1.
            except ValueError:
              # Simply skip the non-integer line.
              continue
    out_file.write(u"VideoId,LabelConfidencePairs\n".encode("utf8"))

    # =========================================
    # Open the vocabulary CSV file and store it in a dictionary.
    # =========================================
    voca_dict = {}
    vocabs = open("./statics/vocabulary.csv", 'r')
    while True:
      line = vocabs.readline()
      if not line:
        break
      vocab_dict_item = line.split(",")
      if vocab_dict_item[0] != "Index":
        voca_dict[vocab_dict_item[0]] = vocab_dict_item[3]
    vocabs.close()

    try:
      while not coord.should_stop():
        video_id_batch_val, video_batch_val, num_frames_batch_val = sess.run(
            [video_id_batch, video_batch, num_frames_batch])
        if FLAGS.segment_labels:
          results = get_segments(video_batch_val, num_frames_batch_val, 5)
          video_segment_ids = results["video_segment_ids"]
          video_id_batch_val = video_id_batch_val[video_segment_ids[:, 0]]
          video_id_batch_val = np.array([
              "%s:%d" % (x.decode("utf8"), y)
              for x, y in zip(video_id_batch_val, video_segment_ids[:, 1])
          ])
          video_batch_val = results["video_batch"]
          num_frames_batch_val = results["num_frames_batch"]
          if input_tensor.get_shape()[1] != video_batch_val.shape[1]:
            raise ValueError("max_frames mismatch. Please re-run the eval.py "
                             "with correct segment_labels settings.")

        predictions_val, = sess.run([predictions_tensor],
                                    feed_dict={
                                        input_tensor: video_batch_val,
                                        num_frames_tensor: num_frames_batch_val
                                    })
        now = time.time()
        num_examples_processed += len(video_batch_val)
        elapsed_time = now - start_time
        logging.info("num examples processed: " + str(num_examples_processed) +
                     " elapsed seconds: " + "{0:.2f}".format(elapsed_time) +
                     " examples/sec: %.2f" %
                     (num_examples_processed / elapsed_time))
        for line in format_lines(video_id_batch_val, predictions_val, top_k,
                                 whitelisted_cls_mask):
          out_file.write(line)
        out_file.flush()

    except tf.errors.OutOfRangeError:
      logging.info("Done with inference. The output file was written to " +
                   out_file.name)
    finally:
      coord.request_stop()

      if FLAGS.segment_labels:
        # Re-read the file and do heap sort.
        # Create multiple heaps.
        logging.info("Post-processing segment predictions...")
        segment_id_list = []
        segment_classes = []
        cls_result_arr = []
        cls_score_dict = {}
        out_file.seek(0, 0)
        old_seg_name = '0000'
        counter = 0
        for line in out_file:
          counter += 1
          if counter % 5000 == 0:  # Log progress every 5000 lines.
            print(counter, " processed")
          segment_id, preds = line.decode("utf8").split(",")
          if segment_id == "VideoId":
            # Skip the headline.
            continue

          preds = preds.split(" ")
          pred_cls_ids = [int(preds[idx]) for idx in range(0, len(preds), 2)]
          pred_cls_scores = [
              float(preds[idx]) for idx in range(1, len(preds), 2)
          ]
          # =======================================
          segment_id = str(segment_id.split(":")[0])
          if segment_id not in segment_id_list:
            segment_id_list.append(str(segment_id))
            segment_classes.append("")
          index = segment_id_list.index(segment_id)
          if old_seg_name != segment_id:
            cls_score_dict[segment_id] = {}
            old_seg_name = segment_id

          for classes in range(0, len(pred_cls_ids)):
            segment_classes[index] = str(
                segment_classes[index]) + str(pred_cls_ids[classes]) + " "
            # Append classes from the new segment.
            if pred_cls_ids[classes] in cls_score_dict[segment_id]:
              cls_score_dict[segment_id][pred_cls_ids[classes]] += \
                  pred_cls_scores[classes]
            else:
              cls_score_dict[segment_id][
                  pred_cls_ids[classes]] = pred_cls_scores[classes]

        for segs, item in zip(segment_id_list, segment_classes):
          # print('====== R E C O R D ======')
          cls_arr = item.split(" ")[:-1]
          cls_arr = list(map(int, cls_arr))
          cls_arr = sorted(cls_arr)  # Sort by class id.
          result_string = ""

          temp = cls_score_dict[segs]
          # Sort by score value, descending.
          temp = sorted(temp.items(), key=operator.itemgetter(1), reverse=True)
          denominator = float(temp[0][1] + temp[1][1] + temp[2][1] +
                              temp[3][1] + temp[4][1])
          # for item in temp:
          for itemIndex in range(0, top_k):
            # Normalize tag name.
            segment_tag = str(voca_dict[str(temp[itemIndex][0])])
            normalized_tag = normalize_tag(segment_tag)
            result_string = result_string + normalized_tag + ":" + format(
                temp[itemIndex][1] / denominator, ".3f") + ","

          cls_result_arr.append(result_string[:-1])
          logging.info(segs + " : " + result_string[:-1])
        # =======================================
        final_out_file.write(
            "vid_id,segment1,segment2,segment3,segment4,segment5\n")
        for seg_id, class_indices in zip(segment_id_list, cls_result_arr):
          final_out_file.write("%s,%s\n" % (seg_id, str(class_indices)))
        final_out_file.close()
        out_file.close()

      coord.join(threads)
      sess.close()
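
# Editor's illustration (hypothetical row, not real output): after
# post-processing, each row of the final CSV pairs a video id with its top_k
# normalized tags and score shares (scores divided by the top-5 score sum):
#
#   abc123,pop-music:0.412,dance:0.233,vlog:0.152,concert:0.109,live:0.094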
def main(unused_argv):
  logging.set_verbosity(tf.logging.INFO)
  if FLAGS.input_model_tgz:
    if FLAGS.train_dir:
      raise ValueError("You cannot supply --train_dir if supplying "
                       "--input_model_tgz")
    # Untar.
    if not os.path.exists(FLAGS.untar_model_dir):
      os.makedirs(FLAGS.untar_model_dir)
    tarfile.open(FLAGS.input_model_tgz).extractall(FLAGS.untar_model_dir)
    FLAGS.train_dir = FLAGS.untar_model_dir

  flags_dict_file = os.path.join(FLAGS.train_dir, "model_flags.json")
  if not file_io.file_exists(flags_dict_file):
    raise IOError("Cannot find %s. Did you run eval.py?" % flags_dict_file)
  flags_dict = json.loads(file_io.FileIO(flags_dict_file, "r").read())

  # convert feature_names and feature_sizes to lists of values
  feature_names, feature_sizes = utils.GetListOfFeatureNamesAndSizes(
      flags_dict["feature_names"], flags_dict["feature_sizes"])

  if flags_dict["frame_features"]:
    reader = readers.YT8MFrameFeatureReader(feature_names=feature_names,
                                            feature_sizes=feature_sizes)
  else:
    reader = readers.YT8MAggregatedFeatureReader(feature_names=feature_names,
                                                 feature_sizes=feature_sizes)

  if not FLAGS.output_file:
    raise ValueError("'output_file' was not specified. "
                     "Unable to continue with inference.")

  if not FLAGS.input_data_pattern:
    raise ValueError("'input_data_pattern' was not specified. "
                     "Unable to continue with inference.")

  inference(reader, FLAGS.train_dir, FLAGS.input_data_pattern,
            FLAGS.output_file, FLAGS.batch_size, FLAGS.top_k)


if __name__ == "__main__":
  app.run()
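
# Editor's note (assumption, not stated in the commit): with the YT8M starter
# code (readers.py, utils.py) on the path and a TensorFlow 1.x environment,
# the binary would presumably be invoked along these lines (paths are
# hypothetical; unset flags fall back to the defaults defined above):
#
#   python inference_kaggle_solution.py --train_dir=./new_model \
#       --input_data_pattern='/path/to/test*.tfrecord' \
#       --output_file=kaggle_solution.csv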