{"id":305,"slug":"humancompatibleai--ppo-pendulum-v1","name":"ppo-Pendulum-v1","author":"HumanCompatibleAI","description":null,"tags":"[\"Reinforcement-Learning\",\"Stable-Baselines3\",\"Pendulum-V1\",\"Deep-Reinforcement-Learning\",\"Model-Index\"]","license":null,"framework":"reinforcement-learning","parameters":null,"downloads":61513,"likes":5,"verified":0,"created_at":"2026-04-20 22:04:14","updated_at":"2026-05-07 22:31:01","source_url":"https://huggingface.co/HumanCompatibleAI/ppo-Pendulum-v1","source_platform":"huggingface","hf_repo_id":"HumanCompatibleAI/ppo-Pendulum-v1","ollama_name":"","category":"model","latest_version":"v1.0.0","version_count":1,"signature_count":1,"risk_level":"MEDIUM","risk_score":50,"versions":[{"id":304,"model_id":305,"version":"v1.0.0","manifest_hash":"3f88c99cbc8db9151f0c6fde4181beff3e49407e0703ae376afa5ca44406fb79","file_count":15,"total_size":469852,"r2_manifest_key":"manifests/humancompatibleai--ppo-pendulum-v1/v1.0.0.json","created_at":"2026-04-20 22:04:14"}],"files":[{"id":8802,"version_id":304,"filename":".gitattributes","sha3_256_hash":"pending-verification","size":1386},{"id":8803,"version_id":304,"filename":"README.md","sha3_256_hash":"pending-verification","size":2398},{"id":8804,"version_id":304,"filename":"args.yml","sha3_256_hash":"pending-verification","size":1204},{"id":8805,"version_id":304,"filename":"config.yml","sha3_256_hash":"pending-verification","size":367},{"id":8806,"version_id":304,"filename":"env_kwargs.yml","sha3_256_hash":"pending-verification","size":23},{"id":8807,"version_id":304,"filename":"ppo-Pendulum-v1.zip","sha3_256_hash":"d2a5572df0c6d6022519615b76c9e6ca5bce0e7d5cf859ec145cbf99a437b8b0","size":137832},{"id":8808,"version_id":304,"filename":"ppo-Pendulum-v1/_stable_baselines3_version","sha3_256_hash":"pending-verification","size":7},{"id":8809,"version_id":304,"filename":"ppo-Pendulum-v1/data","sha3_256_hash":"pending-verification","size":13856},{"id":8810,"version_id":304,"filename":"ppo-Pendulum-v1/policy.optimizer.pth","sha3_256_hash":"38a97ba3110e2c7500d7371d0b6d4cae11d9458e713b3558c89bf99b2f55872b","size":82160},{"id":8811,"version_id":304,"filename":"ppo-Pendulum-v1/policy.pth","sha3_256_hash":"be542f8bb454365173f9e4ea14ab68cabc11b968254a49fb0dbad55bed400c16","size":40382},{"id":8812,"version_id":304,"filename":"ppo-Pendulum-v1/pytorch_variables.pth","sha3_256_hash":"d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1","size":431},{"id":8813,"version_id":304,"filename":"ppo-Pendulum-v1/system_info.txt","sha3_256_hash":"pending-verification","size":266},{"id":8814,"version_id":304,"filename":"replay.mp4","sha3_256_hash":"cc4ccb77c13e09f524899e42ab016875f30055b24e76e4f43eca6047088e5f14","size":174142},{"id":8815,"version_id":304,"filename":"results.json","sha3_256_hash":"pending-verification","size":158},{"id":8816,"version_id":304,"filename":"train_eval_metrics.zip","sha3_256_hash":"690af8420de0d7622537e219353fd187a2691b8cf017e74df2f93166a8b7d477","size":15240}],"signatures":[{"id":761,"version_id":304,"signer_did":"did:quantamrkt:registry:shield-v1","algorithm":"ML-DSA-65","signature_hex":"0a340f298884092fddc58d09032cbc7767fdee4cd47d803bf3c21fb75b3b6c36","attestation_type":"registry","signed_at":"2026-04-20 22:04:14"}],"hndl":{"id":253,"model_id":305,"risk_level":"MEDIUM","risk_score":50,"shelf_life_years":7,"sensitivity":"reinforcement-learning","recommendation":"Monitor and prepare migration plan.","assessed_at":"2026-04-20 22:04:15"}}