You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
- Align archives with the ones updated in PR
7998955
- Use macos-13 instead of macos-12, as the latter is no longer available
- Ubuntu 20.04 is also deprecated (see migration commit in OV
openvinotoolkit/openvino@9e30651)
&& python samples\python\text_generation\lora.py .\TinyLlama\TinyLlama-1.1B-intermediate-step-1431k-3T\ adapter_model.safetensors "How to create a table with two columns, one of them has type float, another one has type int?"
py::class_<StreamerBase, ConstructableStreamer, std::shared_ptr<StreamerBase>>(m, "StreamerBase", streamer_base_docstring) // Change the holder form unique_ptr to shared_ptr
126
-
.def(py::init<>())
127
-
.def("put", &StreamerBase::put, "Put is called every time new token is decoded. Returns a bool flag to indicate whether generation should be stopped, if return true generation stops", py::arg("token"))
128
-
.def("write", &StreamerBase::write, "Write is called every time new token is decoded. Returns a StreamingStatus flag to indicate whether generation should be stopped or cancelled", py::arg("token"))
129
-
.def("end", &StreamerBase::end, "End is called at the end of generation. It can be used to flush cache if your own streamer has one");
auto streamer = py::class_<StreamerBase, ConstructableStreamer, std::shared_ptr<StreamerBase>>(m, "StreamerBase", streamer_base_docstring) // Change the holder form unique_ptr to shared_ptr
131
+
.def(py::init<>())
132
+
.def("write", &StreamerBase::write, "Write is called every time new token is decoded. Returns a StreamingStatus flag to indicate whether generation should be stopped or cancelled", py::arg("token"))
133
+
.def("end", &StreamerBase::end, "End is called at the end of generation. It can be used to flush cache if your own streamer has one");
134
+
135
+
OPENVINO_SUPPRESS_DEPRECATED_START
136
+
streamer.def("put", &StreamerBase::put, "Put is called every time new token is decoded. Returns a bool flag to indicate whether generation should be stopped, if return true generation stops", py::arg("token"));
0 commit comments