mirror of
https://github.com/vale981/ray
synced 2025-03-06 02:21:39 -05:00
[Plasma store] Improve the OOM logging message. (#16051)
This commit is contained in:
parent
5d0b302121
commit
d0dc9abdfc
2 changed files with 12 additions and 5 deletions
|
@@ -719,11 +719,6 @@ cdef int64_t restore_spilled_objects_handler(
|
||||||
"An unexpected internal error occurred while the IO worker "
|
"An unexpected internal error occurred while the IO worker "
|
||||||
"was restoring spilled objects.")
|
"was restoring spilled objects.")
|
||||||
logger.exception(exception_str)
|
logger.exception(exception_str)
|
||||||
ray._private.utils.push_error_to_driver(
|
|
||||||
ray.worker.global_worker,
|
|
||||||
"restore_spilled_objects_error",
|
|
||||||
traceback.format_exc() + exception_str,
|
|
||||||
job_id=None)
|
|
||||||
return bytes_restored
|
return bytes_restored
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@@ -954,6 +954,18 @@ void PlasmaStore::ReplyToCreateClient(const std::shared_ptr<Client> &client,
|
||||||
PlasmaObject result = {};
|
PlasmaObject result = {};
|
||||||
PlasmaError error;
|
PlasmaError error;
|
||||||
bool finished = create_request_queue_.GetRequestResult(req_id, &result, &error);
|
bool finished = create_request_queue_.GetRequestResult(req_id, &result, &error);
|
||||||
|
if (error == PlasmaError::OutOfMemory) {
|
||||||
|
// Logs are suppressed because there is only one OOM error per 10 seconds.
|
||||||
|
RAY_LOG(INFO) << "Out of memory error is reported to the client for an object id "
|
||||||
|
<< object_id << ". Object store current usage "
|
||||||
|
<< (PlasmaAllocator::Allocated() / 1e9) << " / "
|
||||||
|
<< (PlasmaAllocator::GetFootprintLimit() / 1e9)
|
||||||
|
<< " GB. Pinned unevictable objects after spilling: "
|
||||||
|
<< num_bytes_in_use_ / 1024 / 1024
|
||||||
|
<< " MB. Unsealed objects: " << num_bytes_unsealed_ / 1024 / 1024
|
||||||
|
<< " MB. Object size: "
|
||||||
|
<< (result.data_size + result.metadata_size) / 1024 / 1024 << " MB.";
|
||||||
|
}
|
||||||
if (finished) {
|
if (finished) {
|
||||||
RAY_LOG(DEBUG) << "Finishing create object " << object_id << " request ID " << req_id;
|
RAY_LOG(DEBUG) << "Finishing create object " << object_id << " request ID " << req_id;
|
||||||
if (SendCreateReply(client, object_id, result, error).ok() &&
|
if (SendCreateReply(client, object_id, result, error).ok() &&
|
||||||
|
|
Loading…
Add table
Reference in a new issue