{"payload":{"header_redesign_enabled":false,"results":[{"id":"691533062","archived":false,"color":"#DA5B0B","followers":0,"has_funding_file":false,"hl_name":"Mahsatajik/Reinforcement-Learning","hl_trunc_description":"University of Tehran-Reinforcement Learning Fall 2022","language":"Jupyter Notebook","mirror":false,"owned_by_organization":false,"public":true,"repo":{"repository":{"id":691533062,"name":"Reinforcement-Learning","owner_id":144895424,"owner_login":"Mahsatajik","updated_at":"2024-05-25T14:03:52.231Z","has_issues":true}},"sponsorable":false,"topics":["python","reinforcement-learning","monte-carlo","deep-reinforcement-learning","dqn","reinforcement-learning-algorithms","dynamic-programming","markov-decision-processes","policy-iteration","value-iteration","object-oriented-programming","gym-environment","temporal-difference-learning","sarsa-algorithm","q-learning-algorithm"],"type":"Public","help_wanted_issues_count":0,"good_first_issue_issues_count":0,"starred_by_current_user":false}],"type":"repositories","page":1,"page_count":1,"elapsed_millis":66,"errors":[],"result_count":1,"facets":[],"protected_org_logins":[],"topics":null,"query_id":"","logged_in":false,"sign_up_path":"/signup?source=code_search_results","sign_in_path":"/login?return_to=https%3A%2F%2Fgithub.com%2Fsearch%3Fq%3Drepo%253AMahsatajik%252FReinforcement-Learning%2B%2Blanguage%253A%2522Jupyter%2BNotebook%2522","metadata":null,"warn_limited_results":false,"csrf_tokens":{"/Mahsatajik/Reinforcement-Learning/star":{"post":"W5HIzcVSAcvzxnOs_w_BMUUpYXiCVKZPFqv4oytNkMGQN3l3StI7mQVqD44zhe_XuIEsoRCFfYl4jpl-5RGljA"},"/Mahsatajik/Reinforcement-Learning/unstar":{"post":"jXhgiCMGGxmEYV4ec3oMMggHFN4S2XnmmxRHwGc6cbcMgK9xkJiJ6up6X_XsSKT6OMpP1E-xxl6eh0Dmd4dY2w"},"/sponsors/batch_deferred_sponsor_buttons":{"post":"7UenbLEIkdwq8MigUdnj0Qxe35G1WX_BX9SeMLBcLvQpkxBj7aYvwqXpVYpNA3jQPc78ag_LvA-xIn_zeCghWg"}}},"title":"Repository search results"}