# --------------------------------------------------------------------
# BAZEL/Buildkite-CI test cases.
# --------------------------------------------------------------------

# To add new RLlib tests, first find the correct category of your new test
# within this file.

# All new tests - within their category - should be added alphabetically!
# Do not just add tests to the bottom of the file.

# Currently we have the following categories:

# - Learning tests/regression, tagged:
# -- "learning_tests_[discrete|continuous]": distinguish discrete
#    actions vs continuous actions.
# -- "crashing_cartpole" and "stateless_cartpole" to distinguish between
#    simple CartPole and more advanced variants of it.
# -- "ray_data": Tests that rely on ray_data.
# -- "learning_tests_with_ray_data": Learning tests that rely on ray_data.

# - Folder-bound tests, tagged with the name of the top-level dir:
#   - `env` directory tests.
#   - `evaluation` directory tests.
#   - `models` directory tests.
#   - `offline` directory tests.
#   - `policy` directory tests.
#   - `utils` directory tests.

# - Algorithm tests, tagged "algorithms_dir".

# - Tests directory (everything in rllib/tests/...), tagged: "tests_dir"

# - Examples directory (everything in rllib/examples/...), tagged: "examples"

# - Memory leak tests tagged "memory_leak_tests".

# Note: There is a special directory in examples: "documentation" which contains
# all code that is linked to from within the RLlib docs. This code is tested
# separately via the "documentation" tag.

# Additional tags are:
# - "team:rllib": Indicating that all tests in this file are the responsibility of
#   the RLlib Team.
# - "needs_gpu": Indicating that a test needs to have a GPU in order to run.
# - "gpu": Indicating that a test may (but doesn't have to) be run in the GPU
#   pipeline, defined in .buildkite/pipeline.gpu.yml.
# - "multi_gpu": Indicating that a test will definitely be run in the Large GPU
#   pipeline, defined in .buildkite/pipeline.gpu.large.yml.
# - "no_gpu": Indicating that a test should not be run in the GPU pipeline due
#   to certain incompatibilities.
# - "no_tf_eager_tracing": Exclude this test from tf-eager tracing tests.
# - "torch_only": Only run this test case with framework=torch.

# Our .buildkite/pipeline.yml and .buildkite/pipeline.gpu.yml files execute all
# these tests in n different jobs.

load("//bazel:python.bzl", "py_test_module_list")
load("//bazel:python.bzl", "doctest")

# Bundles the `*.parquet` files found under
# tests/data/cartpole/cartpole-v1_large and exposes them to every package.
filegroup(
    name = "cartpole-v1_large",
    data = glob(
        ["tests/data/cartpole/cartpole-v1_large/*.parquet"],
    ),
    visibility = ["//visibility:public"],
)

# Doctest target over all `*.py` files in this package, minus the examples,
# tests, tuned examples, and the individually listed modules below.
doctest(
    size = "enormous",
    # Parquet files made available to the doctests at runtime.
    data = glob(["tests/data/cartpole/cartpole-v1_large/*.parquet"]),
    files = glob(
        ["**/*.py"],
        exclude = [
            "**/examples/**",
            "**/tests/**",
            "**/test_*.py",
            # Skip every *.py file under `tuned_examples`.
            "**/tuned_examples/**",
            # Deprecated modules.
            "utils/window_stat.py",
            "utils/timer.py",
            "utils/memory.py",
            "offline/off_policy_estimator.py",
            "offline/estimators/feature_importance.py",
            "env/wrappers/recsim_wrapper.py",
            "env/remote_vector_env.py",
            # Modules with missing imports.
            "algorithms/dreamerv3/**",
            # FIXME: The docstring examples in the modules below are broken;
            # they were never exercised by a test before.
            "algorithms/algorithm_config.py",
            "algorithms/alpha_star/alpha_star.py",
            "algorithms/r2d2/r2d2.py",
            "algorithms/sac/rnnsac.py",
            "algorithms/simple_q/simple_q.py",
            "core/models/base.py",
            "core/models/specs/specs_base.py",
            "core/models/specs/specs_dict.py",
            "env/wrappers/pettingzoo_env.py",
            "evaluation/collectors/sample_collector.py",
            "evaluation/episode.py",
            "evaluation/metrics.py",
            "evaluation/observation_function.py",
            "evaluation/postprocessing.py",
            "execution/buffers/mixin_replay_buffer.py",
            "models/base_model.py",
            "models/catalog.py",
            "models/preprocessors.py",
            "models/repeated_values.py",
            "models/tf/tf_distributions.py",
            "models/torch/model.py",
            "models/torch/torch_distributions.py",
            "policy/rnn_sequencing.py",
            "utils/actor_manager.py",
            "utils/filter.py",
            "utils/from_config.py",
            "utils/metrics/window_stat.py",
            "utils/nested_dict.py",
            "utils/pre_checks/env.py",
            "utils/replay_buffers/multi_agent_mixin_replay_buffer.py",
            "utils/spaces/space_utils.py",
        ],
    ),
    tags = ["team:rllib"],
)

# --------------------------------------------------------------------
# Benchmarks
#
# Tag: benchmark
#
# This is smoke-testing the benchmark scripts.
# --------------------------------------------------------------------
# Smoke test: runs the torch-compile inference benchmark script with
# `--smoke-test`.
py_test(
    name = "torch_compile_inference_bm",
    size = "small",
    srcs = ["benchmarks/torch_compile/run_inference_bm.py"],
    main = "benchmarks/torch_compile/run_inference_bm.py",
    args = ["--smoke-test"],
    tags = [
        "team:rllib",
        "exclusive",
        "benchmark",
        "torch_2.x_only_benchmark",
    ],
)

# Smoke test: runs the torch-compile PPO-with-inference benchmark script with
# `--smoke-test`.
py_test(
    name = "torch_compile_ppo_with_inference",
    size = "medium",
    srcs = ["benchmarks/torch_compile/run_ppo_with_inference_bm.py"],
    main = "benchmarks/torch_compile/run_ppo_with_inference_bm.py",
    args = ["--smoke-test"],
    tags = [
        "team:rllib",
        "exclusive",
        "benchmark",
        "torch_2.x_only_benchmark",
    ],
)


# --------------------------------------------------------------------
# Algorithms learning regression tests.
#
# Tag: learning_tests
#
# This will test python/yaml config files
# inside rllib/tuned_examples/[algo-name] for actual learning success.
# --------------------------------------------------------------------

# APPO
# CartPole
# Base variant: runs the APPO CartPole tuned example as a test with
# `--num-gpus=1`; carries no GPU pipeline tag.
py_test(
    name = "learning_tests_cartpole_appo",
    size = "large",
    srcs = ["tuned_examples/appo/cartpole_appo.py"],
    main = "tuned_examples/appo/cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "learning_tests_discrete",
        "torch_only",
    ],
)
# "gpu"-tagged variant of the APPO CartPole tuned example (`--num-gpus=1`).
py_test(
    name = "learning_tests_cartpole_appo_gpu",
    size = "large",
    srcs = ["tuned_examples/appo/cartpole_appo.py"],
    main = "tuned_examples/appo/cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "gpu",
    ],
)
# Multi-CPU variant of the APPO CartPole tuned example: passes `--num-gpus=2`
# but carries no GPU pipeline tag.
py_test(
    name = "learning_tests_cartpole_appo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/appo/cartpole_appo.py"],
    main = "tuned_examples/appo/cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "multi_gpu"-tagged variant of the APPO CartPole tuned example
# (`--num-gpus=2`).
py_test(
    name = "learning_tests_cartpole_appo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/appo/cartpole_appo.py"],
    main = "tuned_examples/appo/cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "multi_gpu",
    ],
)
# MultiAgentCartPole
# Base variant: runs the multi-agent APPO CartPole tuned example with two
# agents and `--num-gpus=1`; carries no GPU pipeline tag.
py_test(
    name = "learning_tests_multi_agent_cartpole_appo",
    size = "large",
    srcs = ["tuned_examples/appo/multi_agent_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "learning_tests_discrete",
        "torch_only",
    ],
)
# "gpu"-tagged variant of the multi-agent APPO CartPole tuned example
# (two agents, `--num-gpus=1`, `--num-cpus=6`).
py_test(
    name = "learning_tests_multi_agent_cartpole_appo_gpu",
    size = "large",
    srcs = ["tuned_examples/appo/multi_agent_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-gpus=1",
        "--num-cpus=6",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "gpu",
    ],
)
# Multi-CPU variant of the multi-agent APPO CartPole tuned example: two
# agents, `--num-gpus=2`, `--num-cpus=7`; no GPU pipeline tag.
py_test(
    name = "learning_tests_multi_agent_cartpole_appo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/appo/multi_agent_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-gpus=2",
        "--num-cpus=7",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "multi_gpu"-tagged variant of the multi-agent APPO CartPole tuned example
# (two agents, `--num-gpus=2`, `--num-cpus=7`).
py_test(
    name = "learning_tests_multi_agent_cartpole_appo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/appo/multi_agent_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-gpus=2",
        "--num-cpus=7",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "multi_gpu",
    ],
)
# StatelessCartPole
# Base variant: runs the APPO StatelessCartPole tuned example as a test with
# `--num-gpus=1`; carries no GPU pipeline tag.
py_test(
    name = "learning_tests_stateless_cartpole_appo",
    size = "large",
    srcs = ["tuned_examples/appo/stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "gpu"-tagged variant of the single-agent APPO StatelessCartPole tuned
# example (`--num-gpus=1`).
# The multi-agent flag `--num-agents=2` is intentionally not passed: this
# target runs the single-agent script, and its base, multi-CPU, and multi-GPU
# variants do not pass that flag either.
py_test(
    name = "learning_tests_stateless_cartpole_appo_gpu",
    size = "large",
    srcs = ["tuned_examples/appo/stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "gpu",
    ],
)
# Multi-CPU variant of the APPO StatelessCartPole tuned example: passes
# `--num-gpus=2` but carries no GPU pipeline tag.
py_test(
    name = "learning_tests_stateless_cartpole_appo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/appo/stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "multi_gpu"-tagged variant of the APPO StatelessCartPole tuned example
# (`--num-gpus=2`).
py_test(
    name = "learning_tests_stateless_cartpole_appo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/appo/stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "multi_gpu",
    ],
)
# MultiAgentStatelessCartPole
# Base variant: runs the multi-agent APPO StatelessCartPole tuned example as
# a test with `--num-gpus=1`; carries no GPU pipeline tag.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_appo",
    size = "large",
    srcs = ["tuned_examples/appo/multi_agent_stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "gpu"-tagged variant of the multi-agent APPO StatelessCartPole tuned
# example (two agents, `--num-gpus=1`).
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_appo_gpu",
    size = "large",
    srcs = ["tuned_examples/appo/multi_agent_stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "gpu",
    ],
)
# Multi-CPU variant of the multi-agent APPO StatelessCartPole tuned example:
# passes `--num-gpus=2`, no GPU pipeline tag, "enormous" size.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_appo_multi_cpu",
    size = "enormous",
    srcs = ["tuned_examples/appo/multi_agent_stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "multi_gpu"-tagged variant of the multi-agent APPO StatelessCartPole tuned
# example (`--num-gpus=2`, "enormous" size).
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_appo_multi_gpu",
    size = "enormous",
    srcs = ["tuned_examples/appo/multi_agent_stateless_cartpole_appo.py"],
    main = "tuned_examples/appo/multi_agent_stateless_cartpole_appo.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "multi_gpu",
    ],
)

#@OldAPIStack
# Runs tests/run_regression_tests.py against `tuned_examples/appo`, with the
# separate-losses CartPole APPO config shipped as a data file.
py_test(
    name = "learning_tests_cartpole_separate_losses_appo_old_api_stack",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    args = ["--dir=tuned_examples/appo"],
    data = ["tuned_examples/appo/cartpole-appo-separate-losses.py"],
    tags = [
        "team:rllib",
        "torch_only",
        "exclusive",
        "learning_tests",
        "learning_tests_discrete",
    ],
)

#@OldAPIStack
# Runs tests/run_regression_tests.py against `tuned_examples/appo`, with the
# old-API-stack multi-agent CartPole APPO config shipped as a data file.
py_test(
    name = "learning_tests_multi_agent_cartpole_appo_old_api_stack",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    args = ["--dir=tuned_examples/appo"],
    data = [
        "tuned_examples/appo/multi_agent_cartpole_appo_old_api_stack.py",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "learning_tests_discrete",
    ],
)

#@OldAPIStack
# Runs tests/run_regression_tests.py against `tuned_examples/appo`, with the
# 100-policies multi-agent CartPole APPO config shipped as a data file.
py_test(
    name = "learning_tests_multi_agent_cartpole_w_100_policies_appo_old_api_stack",
    size = "enormous",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    args = ["--dir=tuned_examples/appo"],
    data = [
        "tuned_examples/appo/multi-agent-cartpole-w-100-policies-appo.py",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)

# BC
# CartPole
# Runs the BC CartPole tuned example as a test on the new API stack.
py_test(
    name = "learning_tests_cartpole_bc",
    size = "medium",
    srcs = ["tuned_examples/bc/cartpole_bc.py"],
    main = "tuned_examples/bc/cartpole_bc.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
    ],
    # Offline CartPole data made available to the test at runtime.
    data = [
        "tests/data/cartpole/cartpole-v1_large",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)

# CQL
# Pendulum
# Runs the CQL Pendulum tuned example as a test on the new API stack.
# NOTE(review): this Pendulum target is tagged "learning_tests_cartpole" and
# "learning_tests_discrete" -- confirm against the CI tag filters whether
# that is intended.
py_test(
    name = "learning_tests_pendulum_cql",
    size = "large",
    srcs = ["tuned_examples/cql/pendulum_cql.py"],
    main = "tuned_examples/cql/pendulum_cql.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
    ],
    # Offline Pendulum data made available to the test at runtime.
    data = [
        "tests/data/pendulum/pendulum-v1_enormous",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_cartpole",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)

# DQN
# CartPole
# Base variant: runs the DQN CartPole tuned example as a test on the new API
# stack, without any `--num-gpus` argument.
py_test(
    name = "learning_tests_cartpole_dqn",
    size = "large",
    srcs = ["tuned_examples/dqn/cartpole_dqn.py"],
    main = "tuned_examples/dqn/cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "gpu"-tagged variant of the DQN CartPole tuned example (`--num-gpus=1`).
py_test(
    name = "learning_tests_cartpole_dqn_gpu",
    size = "large",
    srcs = ["tuned_examples/dqn/cartpole_dqn.py"],
    main = "tuned_examples/dqn/cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "gpu",
    ],
)
# Multi-CPU variant of the DQN CartPole tuned example: passes `--num-gpus=2`
# but carries no GPU pipeline tag.
py_test(
    name = "learning_tests_cartpole_dqn_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/dqn/cartpole_dqn.py"],
    main = "tuned_examples/dqn/cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "multi_gpu"-tagged variant of the DQN CartPole tuned example
# (`--num-gpus=2`).
py_test(
    name = "learning_tests_cartpole_dqn_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/dqn/cartpole_dqn.py"],
    main = "tuned_examples/dqn/cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "multi_gpu",
    ],
)
# MultiAgentCartPole
# Base variant: runs the multi-agent DQN CartPole tuned example with two
# agents and `--num-cpus=4`.
py_test(
    name = "learning_tests_multi_agent_cartpole_dqn",
    size = "large",
    srcs = ["tuned_examples/dqn/multi_agent_cartpole_dqn.py"],
    main = "tuned_examples/dqn/multi_agent_cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-cpus=4",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "gpu"-tagged variant of the multi-agent DQN CartPole tuned example
# (two agents, `--num-cpus=4`, `--num-gpus=1`).
py_test(
    name = "learning_tests_multi_agent_cartpole_dqn_gpu",
    size = "large",
    srcs = ["tuned_examples/dqn/multi_agent_cartpole_dqn.py"],
    main = "tuned_examples/dqn/multi_agent_cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-cpus=4",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "gpu",
    ],
)
# Multi-CPU variant of the multi-agent DQN CartPole tuned example: two
# agents, `--num-cpus=5`, `--num-gpus=2`; no GPU pipeline tag.
py_test(
    name = "learning_tests_multi_agent_cartpole_dqn_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/dqn/multi_agent_cartpole_dqn.py"],
    main = "tuned_examples/dqn/multi_agent_cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-cpus=5",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "multi_gpu"-tagged variant of the multi-agent DQN CartPole tuned example
# (two agents, `--num-cpus=4`, `--num-gpus=2`).
py_test(
    name = "learning_tests_multi_agent_cartpole_dqn_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/dqn/multi_agent_cartpole_dqn.py"],
    main = "tuned_examples/dqn/multi_agent_cartpole_dqn.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-agents=2",
        "--num-cpus=4",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "multi_gpu",
    ],
)

# IMPALA
# CartPole
# Base variant: runs the IMPALA CartPole tuned example as a test with
# `--num-gpus=1`; carries no GPU pipeline tag.
py_test(
    name = "learning_tests_cartpole_impala",
    size = "large",
    srcs = ["tuned_examples/impala/cartpole_impala.py"],
    main = "tuned_examples/impala/cartpole_impala.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "learning_tests_discrete",
        "torch_only",
    ],
)
# "gpu"-tagged variant of the IMPALA CartPole tuned example (`--num-gpus=1`).
py_test(
    name = "learning_tests_cartpole_impala_gpu",
    size = "large",
    srcs = ["tuned_examples/impala/cartpole_impala.py"],
    main = "tuned_examples/impala/cartpole_impala.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=1",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "gpu",
    ],
)
# Multi-CPU variant of the IMPALA CartPole tuned example: passes
# `--num-gpus=2` but carries no GPU pipeline tag.
py_test(
    name = "learning_tests_cartpole_impala_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/impala/cartpole_impala.py"],
    main = "tuned_examples/impala/cartpole_impala.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
    ],
)
# "multi_gpu"-tagged variant of the IMPALA CartPole tuned example
# (`--num-gpus=2`).
py_test(
    name = "learning_tests_cartpole_impala_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/impala/cartpole_impala.py"],
    main = "tuned_examples/impala/cartpole_impala.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
        "--num-gpus=2",
    ],
    tags = [
        "team:rllib",
        "exclusive",
        "learning_tests",
        "torch_only",
        "learning_tests_discrete",
        "learning_tests_pytorch_use_all_core",
        "multi_gpu",
    ],
)
# MultiAgentCartPole
# Base variant (no `gpu`/`multi_gpu` tag).
py_test(
    name = "learning_tests_multi_agent_cartpole_impala",
    size = "large",
    srcs = ["tuned_examples/impala/multi_agent_cartpole_impala.py"],
    main = "tuned_examples/impala/multi_agent_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=1", "--num-cpus=6"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "torch_only"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_cartpole_impala_gpu",
    size = "large",
    srcs = ["tuned_examples/impala/multi_agent_cartpole_impala.py"],
    main = "tuned_examples/impala/multi_agent_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=1", "--num-cpus=6"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
# NOTE(review): this is the only variant of the family sized "enormous"; its
# siblings are "large" - confirm the longer timeout is intentional.
py_test(
    name = "learning_tests_multi_agent_cartpole_impala_multi_cpu",
    size = "enormous",
    srcs = ["tuned_examples/impala/multi_agent_cartpole_impala.py"],
    main = "tuned_examples/impala/multi_agent_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2", "--num-cpus=7"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_cartpole_impala_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/impala/multi_agent_cartpole_impala.py"],
    main = "tuned_examples/impala/multi_agent_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2", "--num-cpus=7"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)
# StatelessCartPole
# Base variant (no `gpu`/`multi_gpu` tag); the script is still handed `--num-gpus=1`.
py_test(
    name = "learning_tests_stateless_cartpole_impala",
    size = "large",
    srcs = ["tuned_examples/impala/stateless_cartpole_impala.py"],
    main = "tuned_examples/impala/stateless_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_stateless_cartpole_impala_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/impala/stateless_cartpole_impala.py"],
    main = "tuned_examples/impala/stateless_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)
# MultiAgentStatelessCartPole
# Base variant (no `gpu`/`multi_gpu` tag).
# NOTE(review): neither variant passes `--num-agents`; presumably the script
# supplies its own default - confirm.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_impala",
    size = "large",
    srcs = ["tuned_examples/impala/multi_agent_stateless_cartpole_impala.py"],
    main = "tuned_examples/impala/multi_agent_stateless_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_impala_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/impala/multi_agent_stateless_cartpole_impala.py"],
    main = "tuned_examples/impala/multi_agent_stateless_cartpole_impala.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)

#@OldAPIStack
py_test(
    name = "learning_tests_cartpole_separate_losses_impala_old_api_stack",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    # Experiment definition handed to the regression runner as a data dependency.
    data = ["tuned_examples/impala/cartpole-impala-separate-losses.py"],
    args = ["--dir=tuned_examples/impala"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete"],
)
#@OldAPIStack
py_test(
    name = "learning_tests_multi_agent_cartpole_impala_old_api_stack",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    # Experiment definition handed to the regression runner as a data dependency.
    data = ["tuned_examples/impala/multi_agent_cartpole_impala_old_api_stack.py"],
    args = ["--dir=tuned_examples/impala"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete"],
)

# MARWIL
# CartPole
# MARWIL on CartPole; depends on the recorded offline data listed under `data`.
py_test(
    name = "learning_tests_cartpole_marwil",
    size = "large",
    srcs = ["tuned_examples/marwil/cartpole_marwil.py"],
    main = "tuned_examples/marwil/cartpole_marwil.py",
    # Include the offline data files.
    data = ["tests/data/cartpole/cartpole-v1_large"],
    args = ["--as-test", "--enable-new-api-stack"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# PPO
# CartPole
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_cartpole_ppo",
    size = "large",
    srcs = ["tuned_examples/ppo/cartpole_ppo.py"],
    main = "tuned_examples/ppo/cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete", "torch_only"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_cartpole_ppo_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/cartpole_ppo.py"],
    main = "tuned_examples/ppo/cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
py_test(
    name = "learning_tests_cartpole_ppo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/ppo/cartpole_ppo.py"],
    main = "tuned_examples/ppo/cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_cartpole_ppo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/cartpole_ppo.py"],
    main = "tuned_examples/ppo/cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)
# MultiAgentCartPole
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_multi_agent_cartpole_ppo",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete", "torch_only"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_cartpole_ppo_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
py_test(
    name = "learning_tests_multi_agent_cartpole_ppo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_cartpole_ppo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)
# CartPole (truncated)
# Only one variant of this script is registered (no GPU flag, no GPU tag).
py_test(
    name = "learning_tests_cartpole_truncated_ppo",
    size = "large",
    srcs = ["tuned_examples/ppo/cartpole_truncated_ppo.py"],
    main = "tuned_examples/ppo/cartpole_truncated_ppo.py",
    args = ["--as-test", "--enable-new-api-stack"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete", "torch_only"],
)
# StatelessCartPole
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_stateless_cartpole_ppo",
    size = "large",
    srcs = ["tuned_examples/ppo/stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete", "torch_only"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_stateless_cartpole_ppo_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
py_test(
    name = "learning_tests_stateless_cartpole_ppo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/ppo/stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_stateless_cartpole_ppo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)
# MultiAgentStatelessCartPole
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_ppo",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete", "torch_only"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_ppo_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_ppo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_stateless_cartpole_ppo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_stateless_cartpole_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_discrete", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)
# Pendulum
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_pendulum_ppo",
    size = "large",
    srcs = ["tuned_examples/ppo/pendulum_ppo.py"],
    main = "tuned_examples/ppo/pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack"],
    tags = ["torch_only", "team:rllib", "exclusive", "learning_tests", "learning_tests_continuous"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_pendulum_ppo_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/pendulum_ppo.py"],
    main = "tuned_examples/ppo/pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "learning_tests_pytorch_use_all_core", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
py_test(
    name = "learning_tests_pendulum_ppo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/ppo/pendulum_ppo.py"],
    main = "tuned_examples/ppo/pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_pendulum_ppo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/pendulum_ppo.py"],
    main = "tuned_examples/ppo/pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)
# MultiAgentPendulum
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_multi_agent_pendulum_ppo",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_pendulum_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_continuous", "torch_only"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_pendulum_ppo_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_pendulum_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "learning_tests_pytorch_use_all_core", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
py_test(
    name = "learning_tests_multi_agent_pendulum_ppo_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_pendulum_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "learning_tests_pytorch_use_all_core"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_pendulum_ppo_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/ppo/multi_agent_pendulum_ppo.py"],
    main = "tuned_examples/ppo/multi_agent_pendulum_ppo.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "learning_tests_pytorch_use_all_core", "multi_gpu"],
)

#@OldAPIStack
py_test(
    name = "learning_tests_pendulum_ppo_old_api_stack",
    # bazel may complain about it being too long sometimes - large is on purpose as some frameworks take longer
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    data = ["tuned_examples/ppo/pendulum-ppo.yaml"],
    args = ["--dir=tuned_examples/ppo"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_continuous", "no_tf_static_graph"],
)

#@OldAPIStack
py_test(
    name = "learning_tests_transformed_actions_pendulum_ppo_old_api_stack",
    # bazel may complain about it being too long sometimes - large is on purpose as some frameworks take longer
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    data = ["tuned_examples/ppo/pendulum-transformed-actions-ppo.yaml"],
    args = ["--dir=tuned_examples/ppo"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_continuous", "no_tf_static_graph"],
)

#@OldAPIStack
py_test(
    name = "learning_tests_repeat_after_me_ppo_old_api_stack",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    main = "tests/run_regression_tests.py",
    data = ["tuned_examples/ppo/repeatafterme-ppo-lstm.yaml"],
    args = ["--dir=tuned_examples/ppo"],
    tags = ["team:rllib", "exclusive", "learning_tests", "learning_tests_discrete"],
)

# SAC
# Pendulum
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_pendulum_sac",
    size = "large",
    srcs = ["tuned_examples/sac/pendulum_sac.py"],
    main = "tuned_examples/sac/pendulum_sac.py",
    args = ["--as-test", "--enable-new-api-stack"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_pendulum_sac_gpu",
    size = "large",
    srcs = ["tuned_examples/sac/pendulum_sac.py"],
    main = "tuned_examples/sac/pendulum_sac.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
py_test(
    name = "learning_tests_pendulum_sac_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/sac/pendulum_sac.py"],
    main = "tuned_examples/sac/pendulum_sac.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous"],
)

# `multi_gpu`-tagged variant.
py_test(
    name = "learning_tests_pendulum_sac_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/sac/pendulum_sac.py"],
    main = "tuned_examples/sac/pendulum_sac.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "multi_gpu"],
)
# MultiAgentPendulum
# Base variant: no GPU flag, no GPU tag.
py_test(
    name = "learning_tests_multi_agent_pendulum_sac",
    size = "large",
    srcs = ["tuned_examples/sac/multi_agent_pendulum_sac.py"],
    main = "tuned_examples/sac/multi_agent_pendulum_sac.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-cpus=4"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous"],
)

# `gpu`-tagged variant.
py_test(
    name = "learning_tests_multi_agent_pendulum_sac_gpu",
    size = "large",
    srcs = ["tuned_examples/sac/multi_agent_pendulum_sac.py"],
    main = "tuned_examples/sac/multi_agent_pendulum_sac.py",
    args = ["--as-test", "--enable-new-api-stack", "--num-agents=2", "--num-cpus=4", "--num-gpus=1"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "gpu"],
)

# `multi_cpu` variant: passes `--num-gpus=2` but carries no GPU tag.
# NOTE(review): unlike the two variants above, this one and the `multi_gpu`
# variant below pass neither `--as-test` nor `--num-cpus=4` - confirm that
# this is intentional.
py_test(
    name = "learning_tests_multi_agent_pendulum_sac_multi_cpu",
    size = "large",
    srcs = ["tuned_examples/sac/multi_agent_pendulum_sac.py"],
    main = "tuned_examples/sac/multi_agent_pendulum_sac.py",
    args = ["--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous"],
)

# `multi_gpu`-tagged variant (same argument list as `multi_cpu`).
py_test(
    name = "learning_tests_multi_agent_pendulum_sac_multi_gpu",
    size = "large",
    srcs = ["tuned_examples/sac/multi_agent_pendulum_sac.py"],
    main = "tuned_examples/sac/multi_agent_pendulum_sac.py",
    args = ["--enable-new-api-stack", "--num-agents=2", "--num-gpus=2"],
    tags = ["team:rllib", "exclusive", "learning_tests", "torch_only", "learning_tests_continuous", "multi_gpu"],
)

# --------------------------------------------------------------------
# Algorithms (Compilation, Losses, simple functionality tests)
# rllib/algorithms/
#
# Tag: algorithms_dir
# --------------------------------------------------------------------

# Generic (all Algorithms)

# Needs the small CartPole JSON sample as a data dependency.
py_test(
    name = "test_algorithm",
    size = "large",
    srcs = ["algorithms/tests/test_algorithm.py"],
    data = ["tests/data/cartpole/small.json"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_algorithm_config",
    size = "medium",
    srcs = ["algorithms/tests/test_algorithm_config.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_algorithm_export_checkpoint",
    size = "medium",
    srcs = ["algorithms/tests/test_algorithm_export_checkpoint.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_algorithm_save_load_checkpoint_learner",
    size = "medium",
    srcs = ["algorithms/tests/test_algorithm_save_load_checkpoint_learner.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_algorithm_rl_module_restore",
    size = "large",
    srcs = ["algorithms/tests/test_algorithm_rl_module_restore.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_algorithm_imports",
    size = "small",
    srcs = ["algorithms/tests/test_algorithm_imports.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_callbacks_on_algorithm",
    size = "large",
    srcs = ["algorithms/tests/test_callbacks_on_algorithm.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_callbacks_on_env_runner",
    size = "medium",
    srcs = ["algorithms/tests/test_callbacks_on_env_runner.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

# @OldAPIStack
py_test(
    name = "test_callbacks_old_api_stack",
    size = "medium",
    srcs = ["algorithms/tests/test_callbacks_old_api_stack.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

py_test(
    name = "test_registry",
    size = "small",
    srcs = ["algorithms/tests/test_registry.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic"],
)

# Tagged `exclusive` in addition to the generic algorithm tags.
py_test(
    name = "test_env_runner_failures",
    size = "large",
    srcs = ["algorithms/tests/test_env_runner_failures.py"],
    tags = ["team:rllib", "algorithms_dir", "algorithms_dir_generic", "exclusive"],
)

# NOTE(review): the source lives under algorithms/tests/, yet the target is
# tagged `tests_dir` rather than `algorithms_dir` - confirm which CI bucket
# this test is meant to run in.
py_test(
    name = "test_node_failures",
    size = "large",
    srcs = ["algorithms/tests/test_node_failures.py"],
    tags = ["team:rllib", "tests_dir", "exclusive"],
)


# Specific Algorithms

# APPO
# @OldAPIStack
py_test(
    name = "test_appo",
    size = "large",
    srcs = ["algorithms/appo/tests/test_appo.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

py_test(
    name = "test_appo_learner",
    size = "medium",
    srcs = ["algorithms/appo/tests/test_appo_learner.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# BC
py_test(
    name = "test_bc",
    size = "medium",
    srcs = ["algorithms/bc/tests/test_bc.py"],
    # Include the offline data files.
    data = ["tests/data/cartpole/cartpole-v1_large"],
    tags = ["team:rllib", "algorithms_dir"],
)

# @OldAPIStack
py_test(
    name = "test_bc_old_api_stack",
    size = "medium",
    srcs = ["algorithms/bc/tests/test_bc_old_api_stack.py"],
    # Include the json data file.
    data = ["tests/data/cartpole/large.json"],
    tags = ["team:rllib", "algorithms_dir"],
)

# CQL
# Needs the small Pendulum JSON sample as a data dependency.
py_test(
    name = "test_cql",
    size = "large",
    srcs = ["algorithms/cql/tests/test_cql.py"],
    data = ["tests/data/pendulum/small.json"],
    tags = ["team:rllib", "algorithms_dir"],
)

# DQN
py_test(
    name = "test_dqn",
    size = "large",
    srcs = ["algorithms/dqn/tests/test_dqn.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# DreamerV3
py_test(
    name = "test_dreamerv3",
    size = "large",
    srcs = ["algorithms/dreamerv3/tests/test_dreamerv3.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# IMPALA
py_test(
    name = "test_impala",
    size = "large",
    srcs = ["algorithms/impala/tests/test_impala.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

py_test(
    name = "test_vtrace_v2",
    size = "small",
    srcs = ["algorithms/impala/tests/test_vtrace_v2.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# @OldAPIStack
py_test(
    name = "test_vtrace_old_api_stack",
    size = "small",
    srcs = ["algorithms/impala/tests/test_vtrace_old_api_stack.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# MARWIL
py_test(
    name = "test_marwil",
    size = "large",
    srcs = ["algorithms/marwil/tests/test_marwil.py"],
    # Include the offline data files.
    data = [
        "tests/data/cartpole/cartpole-v1_large",
        "tests/data/pendulum/pendulum-v1_large",
    ],
    tags = ["team:rllib", "algorithms_dir"],
)

py_test(
    name = "test_marwil_rl_module",
    size = "large",
    srcs = ["algorithms/marwil/tests/test_marwil_rl_module.py"],
    # Include the json data file.
    data = [
        "tests/data/cartpole/large.json",
    ],
    tags = ["team:rllib", "algorithms_dir"],
)

# @OldAPIStack
py_test(
    name = "test_marwil_old_api_stack",
    size = "large",
    srcs = ["algorithms/marwil/tests/test_marwil_old_api_stack.py"],
    # Include the json data files.
    data = [
        "tests/data/cartpole/large.json",
        "tests/data/pendulum/large.json",
        "tests/data/cartpole/small.json",
    ],
    tags = ["team:rllib", "algorithms_dir"],
)

# PPO
py_test(
    name = "test_ppo",
    size = "medium",
    srcs = ["algorithms/ppo/tests/test_ppo.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

py_test(
    name = "test_ppo_rl_module",
    size = "large",
    srcs = ["algorithms/ppo/tests/test_ppo_rl_module.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

py_test(
    name = "test_ppo_learner",
    size = "large",
    srcs = ["algorithms/ppo/tests/test_ppo_learner.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# @OldAPIStack
py_test(
    name = "test_ppo_old_api_stack",
    size = "large",
    srcs = ["algorithms/ppo/tests/test_ppo_old_api_stack.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# SAC
py_test(
    name = "test_sac",
    size = "large",
    srcs = ["algorithms/sac/tests/test_sac.py"],
    tags = ["team:rllib", "algorithms_dir"],
)

# --------------------------------------------------------------------
# Memory leak tests
#
# Tag: memory_leak_tests
# --------------------------------------------------------------------

# @OldAPIStack
# All three targets below share the same runner script and differ only in the
# YAML file shipped as data and the `--dir` handed to the runner.
py_test(
    name = "test_memory_leak_appo_old_api_stack",
    size = "large",
    srcs = ["utils/tests/run_memory_leak_tests.py"],
    main = "utils/tests/run_memory_leak_tests.py",
    data = ["tuned_examples/appo/memory-leak-test-appo.yaml"],
    args = ["--dir=tuned_examples/appo"],
    tags = ["team:rllib", "memory_leak_tests"],
)

# @OldAPIStack
py_test(
    name = "test_memory_leak_impala_old_api_stack",
    size = "large",
    srcs = ["utils/tests/run_memory_leak_tests.py"],
    main = "utils/tests/run_memory_leak_tests.py",
    data = ["tuned_examples/impala/memory-leak-test-impala.yaml"],
    args = ["--dir=tuned_examples/impala"],
    tags = ["team:rllib", "memory_leak_tests"],
)

# @OldAPIStack
py_test(
    name = "test_memory_leak_ppo_old_api_stack",
    size = "large",
    srcs = ["utils/tests/run_memory_leak_tests.py"],
    main = "utils/tests/run_memory_leak_tests.py",
    data = ["tuned_examples/ppo/memory-leak-test-ppo.yaml"],
    args = ["--dir=tuned_examples/ppo"],
    tags = ["team:rllib", "memory_leak_tests"],
)


# --------------------------------------------------------------------
# Connector(V1) tests
# rllib/connectors/
#
# Tag: connector
# --------------------------------------------------------------------

# Target names in this section mirror the source path (minus the `.py` suffix).
py_test(
    name = "connectors/tests/test_connector",
    size = "small",
    srcs = ["connectors/tests/test_connector.py"],
    tags = ["team:rllib", "connector"],
)

py_test(
    name = "connectors/tests/test_action",
    size = "small",
    srcs = ["connectors/tests/test_action.py"],
    tags = ["team:rllib", "connector"],
)

py_test(
    name = "connectors/tests/test_agent",
    size = "medium",
    srcs = ["connectors/tests/test_agent.py"],
    tags = ["team:rllib", "connector"],
)

# --------------------------------------------------------------------
# ConnectorV2 tests
# rllib/connectors/
#
# Tag: connector_v2
# --------------------------------------------------------------------

# TODO (sven): Add these tests in a separate PR.
# py_test(
#    name = "connectors/tests/test_connector_v2",
#    tags = ["team:rllib", "connector_v2"],
#    size = "small",
#    srcs = ["connectors/tests/test_connector_v2.py"]
# )

# --------------------------------------------------------------------
# Env tests
# rllib/env/
#
# Tag: env
# --------------------------------------------------------------------

py_test(
    name = "env/tests/test_infinite_lookback_buffer",
    size = "small",
    srcs = ["env/tests/test_infinite_lookback_buffer.py"],
    tags = ["team:rllib", "env"],
)

# CI all of a sudden has problems with accessing the ports.
# sh_test(
#    name = "env/tests/test_local_inference_cartpole",
#    tags = ["team:rllib", "env"],
#    size = "medium",
#    srcs = ["env/tests/test_policy_client_server_setup.sh"],
#    args = ["local", "cartpole", "8800"],
#    data = glob(["examples/envs/external_envs/*.py"]),
# )

# sh_test(
#    name = "env/tests/test_local_inference_cartpole_w_2_concurrent_episodes",
#    tags = ["team:rllib", "env"],
#    size = "medium",
#    srcs = ["env/tests/test_policy_client_server_setup.sh"],
#    args = ["local", "cartpole-dummy-2-episodes", "8830"],
#    data = glob(["examples/envs/external_envs/*.py"]),
# )

# Tests with unity 3d and external envs currently don't work
# see: https://github.com/ray-project/ray/issues/34290 for more details
# sh_test(
#     name = "env/tests/test_local_inference_unity3d",
#     tags = ["team:rllib", "env"],
#     size = "large", # bazel may complain about it being too long sometimes - large is on purpose as some frameworks take longer
#     srcs = ["env/tests/test_policy_client_server_setup.sh"],
#     args = ["local", "unity3d", "8850"],
#     data = glob(["examples/envs/external_envs/*.py"]),
# )

# NOTE(review): tagged `tests_dir`, whereas the neighbouring env/ targets use
# the `env` tag - confirm which CI bucket this test is meant to run in.
py_test(
    name = "env/tests/test_multi_agent_env",
    size = "large",
    srcs = ["env/tests/test_multi_agent_env.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "env/tests/test_multi_agent_env_runner",
    size = "medium",
    srcs = ["env/tests/test_multi_agent_env_runner.py"],
    tags = ["team:rllib", "env"],
)

py_test(
    name = "env/tests/test_multi_agent_episode",
    size = "medium",
    srcs = ["env/tests/test_multi_agent_episode.py"],
    tags = ["team:rllib", "env"],
)

# CI all of a sudden has problems with accessing the ports.
# sh_test(
#    name = "env/tests/test_remote_inference_cartpole",
#    tags = ["team:rllib", "env", "exclusive"],
#    size = "large", # bazel may complain about it being too long sometimes - large is on purpose as some frameworks take longer
#    srcs = ["env/tests/test_policy_client_server_setup.sh"],
#    args = ["remote", "cartpole", "8810"],
#    data = glob(["examples/envs/external_envs/*.py"]),
# )

# sh_test(
#    name = "env/tests/test_remote_inference_cartpole_lstm",
#    tags = ["team:rllib", "env", "exclusive"],
#    size = "large", # bazel may complain about it being too long sometimes - large is on purpose as some frameworks take longer
#    srcs = ["env/tests/test_policy_client_server_setup.sh"],
#    args = ["remote", "cartpole_lstm", "8820"],
#    data = glob(["examples/envs/external_envs/*.py"]),
# )

# sh_test(
#    name = "env/tests/test_remote_inference_cartpole_w_2_concurrent_episodes",
#    tags = ["team:rllib", "env", "exclusive"],
#    size = "large", # bazel may complain about it being too long sometimes - large is on purpose as some frameworks take longer
#    srcs = ["env/tests/test_policy_client_server_setup.sh"],
#    args = ["remote", "cartpole-dummy-2-episodes", "8840"],
#    data = glob(["examples/envs/external_envs/*.py"]),
# )

# Tests with unity 3d and external envs currently don't work
# see: https://github.com/ray-project/ray/issues/34290 for more details
# sh_test(
#     name = "env/tests/test_remote_inference_unity3d",
#     tags = ["team:rllib", "env", "exclusive"],
#     size = "small",
#     srcs = ["env/tests/test_policy_client_server_setup.sh"],
#     args = ["remote", "unity3d", "8860"],
#     data = glob(["examples/envs/external_envs/*.py"]),
# )

# Single-agent env tests (env/tests/) and env wrapper tests (env/wrappers/tests/).
py_test(
    name = "env/tests/test_single_agent_env_runner",
    size = "medium",
    srcs = ["env/tests/test_single_agent_env_runner.py"],
    tags = ["team:rllib", "env"],
)

py_test(
    name = "env/tests/test_single_agent_episode",
    size = "small",
    srcs = ["env/tests/test_single_agent_episode.py"],
    tags = ["team:rllib", "env"],
)

py_test(
    name = "env/wrappers/tests/test_exception_wrapper",
    size = "small",
    srcs = ["env/wrappers/tests/test_exception_wrapper.py"],
    tags = ["team:rllib", "env"],
)

py_test(
    name = "env/wrappers/tests/test_group_agents_wrapper",
    size = "small",
    srcs = ["env/wrappers/tests/test_group_agents_wrapper.py"],
    tags = ["team:rllib", "env"],
)

py_test(
    name = "env/wrappers/tests/test_unity3d_env",
    size = "small",
    srcs = ["env/wrappers/tests/test_unity3d_env.py"],
    tags = ["team:rllib", "env"],
)

# --------------------------------------------------------------------
# Evaluation components
# rllib/evaluation/
#
# Tag: evaluation
# --------------------------------------------------------------------
# This target's sources live under env/tests/, but it is tagged "evaluation".
py_test(
    name = "env/tests/test_env_runner_group",
    size = "small",
    srcs = ["env/tests/test_env_runner_group.py"],
    tags = ["team:rllib", "evaluation", "exclusive"],
)

# @OldAPIStack
py_test(
    name = "evaluation/tests/test_agent_collector",
    size = "small",
    srcs = ["evaluation/tests/test_agent_collector.py"],
    tags = ["team:rllib", "evaluation"],
)

# @OldAPIStack
py_test(
    name = "evaluation/tests/test_env_runner_v2",
    size = "small",
    srcs = ["evaluation/tests/test_env_runner_v2.py"],
    tags = ["team:rllib", "evaluation"],
)

# @OldAPIStack
py_test(
    name = "evaluation/tests/test_episode",
    size = "small",
    srcs = ["evaluation/tests/test_episode.py"],
    tags = ["team:rllib", "evaluation"],
)

# @OldAPIStack
py_test(
    name = "evaluation/tests/test_episode_v2",
    size = "small",
    srcs = ["evaluation/tests/test_episode_v2.py"],
    tags = ["team:rllib", "evaluation"],
)

# @OldAPIStack
py_test(
    name = "evaluation/tests/test_postprocessing",
    size = "small",
    srcs = ["evaluation/tests/test_postprocessing.py"],
    tags = ["team:rllib", "evaluation"],
)

# @OldAPIStack
py_test(
    name = "evaluation/tests/test_rollout_worker",
    size = "large",
    srcs = ["evaluation/tests/test_rollout_worker.py"],
    tags = ["team:rllib", "evaluation", "exclusive"],
)

# --------------------------------------------------------------------
# RLlib core
# rllib/core/
#
# Tag: core
# --------------------------------------------------------------------

# Catalog
py_test(
    name = "test_catalog",
    size = "medium",
    srcs = ["core/models/tests/test_catalog.py"],
    tags = ["team:rllib", "core"],
)

# Default Models
py_test(
    name = "test_base_models",
    size = "small",
    srcs = ["core/models/tests/test_base_models.py"],
    tags = ["team:rllib", "core"],
)

py_test(
    name = "test_cnn_encoders",
    size = "large",
    srcs = ["core/models/tests/test_cnn_encoders.py"],
    tags = ["team:rllib", "core", "models"],
)

py_test(
    name = "test_cnn_transpose_heads",
    size = "medium",
    srcs = ["core/models/tests/test_cnn_transpose_heads.py"],
    tags = ["team:rllib", "core", "models"],
)

py_test(
    name = "test_mlp_encoders",
    size = "medium",
    srcs = ["core/models/tests/test_mlp_encoders.py"],
    tags = ["team:rllib", "core", "models"],
)

py_test(
    name = "test_mlp_heads",
    size = "medium",
    srcs = ["core/models/tests/test_mlp_heads.py"],
    tags = ["team:rllib", "core", "models"],
)

py_test(
    name = "test_recurrent_encoders",
    size = "medium",
    srcs = ["core/models/tests/test_recurrent_encoders.py"],
    tags = ["team:rllib", "core", "models"],
)

# RLModule
# Passes "TestRLModule" as the only command-line argument to the test script
# (presumably to select that test class -- confirm against the script).
py_test(
    name = "test_torch_rl_module",
    size = "medium",
    srcs = ["core/rl_module/torch/tests/test_torch_rl_module.py"],
    args = ["TestRLModule"],
    tags = ["team:rllib", "core"],
)

# TODO(Artur): Comment this back in as soon as we can test with GPU
# py_test(
#    name = "test_torch_rl_module_gpu",
#    main = "core/rl_module/torch/tests/test_torch_rl_module.py",
#    tags = ["team:rllib", "core", "gpu", "exclusive"],
#    size = "medium",
#    srcs = ["core/rl_module/torch/tests/test_torch_rl_module.py"],
#    args = ["TestRLModuleGPU"],
# )

# Remaining RLModule tests (tf, multi-module, and spec tests).
py_test(
    name = "test_tf_rl_module",
    size = "medium",
    srcs = ["core/rl_module/tf/tests/test_tf_rl_module.py"],
    tags = ["team:rllib", "core"],
)

py_test(
    name = "test_multi_rl_module",
    size = "medium",
    srcs = ["core/rl_module/tests/test_multi_rl_module.py"],
    tags = ["team:rllib", "core"],
)

py_test(
    name = "test_rl_module_specs",
    size = "medium",
    srcs = ["core/rl_module/tests/test_rl_module_specs.py"],
    tags = ["team:rllib", "core"],
)

# Learner
# The four TestLearnerGroup* targets share one source file
# (core/learner/tests/test_learner_group.py) and differ only in the single
# argument passed to it, which equals the target name.
py_test(
    name = "TestLearnerGroupSyncUpdate",
    size = "large",
    srcs = ["core/learner/tests/test_learner_group.py"],
    args = ["TestLearnerGroupSyncUpdate"],
    main = "core/learner/tests/test_learner_group.py",
    tags = ["team:rllib", "multi_gpu", "exclusive"],
)

py_test(
    name = "TestLearnerGroupCheckpointRestore",
    size = "large",
    srcs = ["core/learner/tests/test_learner_group.py"],
    args = ["TestLearnerGroupCheckpointRestore"],
    main = "core/learner/tests/test_learner_group.py",
    tags = ["team:rllib", "multi_gpu", "exclusive"],
)

py_test(
    name = "TestLearnerGroupAsyncUpdate",
    size = "large",
    srcs = ["core/learner/tests/test_learner_group.py"],
    args = ["TestLearnerGroupAsyncUpdate"],
    main = "core/learner/tests/test_learner_group.py",
    tags = ["team:rllib", "multi_gpu", "exclusive"],
)

py_test(
    name = "TestLearnerGroupSaveLoadState",
    size = "large",
    srcs = ["core/learner/tests/test_learner_group.py"],
    args = ["TestLearnerGroupSaveLoadState"],
    main = "core/learner/tests/test_learner_group.py",
    tags = ["team:rllib", "multi_gpu", "exclusive"],
)

py_test(
    name = "test_learner",
    size = "medium",
    srcs = ["core/learner/tests/test_learner.py"],
    tags = ["team:rllib", "core", "ray_data"],
)

py_test(
    name = "test_torch_learner_compile",
    size = "medium",
    srcs = ["core/learner/torch/tests/test_torch_learner_compile.py"],
    tags = ["team:rllib", "core", "ray_data"],
)

# --------------------------------------------------------------------
# Models and Distributions
# rllib/models/
#
# Tag: models
# --------------------------------------------------------------------

py_test(
    name = "test_attention_nets",
    size = "large",
    srcs = ["models/tests/test_attention_nets.py"],
    tags = ["team:rllib", "models"],
)

py_test(
    name = "test_conv2d_default_stacks",
    size = "small",
    srcs = ["models/tests/test_conv2d_default_stacks.py"],
    tags = ["team:rllib", "models"],
)

# Declares the obstacle-tower image as a runtime data dependency.
py_test(
    name = "test_convtranspose2d_stack",
    size = "medium",
    srcs = ["models/tests/test_convtranspose2d_stack.py"],
    data = glob(["tests/data/images/obstacle_tower.png"]),
    tags = ["team:rllib", "models"],
)

py_test(
    name = "test_action_distributions",
    size = "medium",
    srcs = ["models/tests/test_action_distributions.py"],
    tags = ["team:rllib", "models"],
)

py_test(
    name = "test_distributions",
    size = "small",
    srcs = ["models/tests/test_distributions.py"],
    tags = ["team:rllib", "models"],
)

py_test(
    name = "test_lstms",
    size = "large",
    srcs = ["models/tests/test_lstms.py"],
    tags = ["team:rllib", "models"],
)

py_test(
    name = "test_models",
    size = "medium",
    srcs = ["models/tests/test_models.py"],
    tags = ["team:rllib", "models"],
)

py_test(
    name = "test_preprocessors",
    size = "medium",
    srcs = ["models/tests/test_preprocessors.py"],
    tags = ["team:rllib", "models"],
)


# --------------------------------------------------------------------
# Offline
# rllib/offline/
#
# Tag: offline
# --------------------------------------------------------------------

py_test(
    name = "test_dataset_reader",
    size = "small",
    srcs = ["offline/tests/test_dataset_reader.py"],
    data = [
        "tests/data/pendulum/large.json",
        "tests/data/pendulum/enormous.zip",
    ],
    tags = ["team:rllib", "offline"],
)

py_test(
    name = "test_feature_importance",
    size = "medium",
    srcs = ["offline/tests/test_feature_importance.py"],
    tags = ["team:rllib", "offline", "torch_only"],
)

py_test(
    name = "test_json_reader",
    size = "small",
    srcs = ["offline/tests/test_json_reader.py"],
    data = ["tests/data/pendulum/large.json"],
    tags = ["team:rllib", "offline"],
)

py_test(
    name = "test_ope",
    size = "medium",
    srcs = ["offline/estimators/tests/test_ope.py"],
    data = ["tests/data/cartpole/small.json"],
    tags = ["team:rllib", "offline", "ray_data"],
)

py_test(
    name = "test_ope_math",
    size = "small",
    srcs = ["offline/estimators/tests/test_ope_math.py"],
    tags = ["team:rllib", "offline"],
)

py_test(
    name = "test_dm_learning",
    size = "large",
    srcs = ["offline/estimators/tests/test_dm_learning.py"],
    tags = ["team:rllib", "offline"],
)

py_test(
    name = "test_dr_learning",
    size = "large",
    srcs = ["offline/estimators/tests/test_dr_learning.py"],
    tags = ["team:rllib", "offline"],
)

py_test(
    name = "test_offline_env_runner",
    size = "small",
    srcs = ["offline/tests/test_offline_env_runner.py"],
    tags = ["team:rllib", "offline"],
)

py_test(
    name = "test_offline_data",
    size = "medium",
    srcs = ["offline/tests/test_offline_data.py"],
    # Offline data files made available to the test at runtime.
    data = [
        "tests/data/cartpole/cartpole-v1_large",
        "tests/data/cartpole/large.json",
    ],
    tags = ["team:rllib", "offline"],
)

py_test(
    name = "test_offline_prelearner",
    size = "medium",
    srcs = ["offline/tests/test_offline_prelearner.py"],
    # Offline data files made available to the test at runtime.
    data = [
        "tests/data/cartpole/cartpole-v1_large",
        "tests/data/cartpole/large.json",
    ],
    tags = ["team:rllib", "offline"],
)

# --------------------------------------------------------------------
# Policies
# rllib/policy/
#
# Tag: policy
# --------------------------------------------------------------------

py_test(
    name = "policy/tests/test_compute_log_likelihoods",
    size = "medium",
    srcs = ["policy/tests/test_compute_log_likelihoods.py"],
    tags = ["team:rllib", "policy"],
)

py_test(
    name = "policy/tests/test_export_checkpoint_and_model",
    size = "large",
    srcs = ["policy/tests/test_export_checkpoint_and_model.py"],
    tags = ["team:rllib", "policy"],
)

py_test(
    name = "policy/tests/test_multi_agent_batch",
    size = "small",
    srcs = ["policy/tests/test_multi_agent_batch.py"],
    tags = ["team:rllib", "policy"],
)

py_test(
    name = "policy/tests/test_policy",
    size = "medium",
    srcs = ["policy/tests/test_policy.py"],
    tags = ["team:rllib", "policy"],
)

py_test(
    name = "policy/tests/test_policy_map",
    size = "medium",
    srcs = ["policy/tests/test_policy_map.py"],
    tags = ["team:rllib", "policy"],
)

py_test(
    name = "policy/tests/test_policy_state_swapping",
    size = "medium",
    srcs = ["policy/tests/test_policy_state_swapping.py"],
    tags = ["team:rllib", "policy", "gpu"],
)

py_test(
    name = "policy/tests/test_rnn_sequencing",
    size = "small",
    srcs = ["policy/tests/test_rnn_sequencing.py"],
    tags = ["team:rllib", "policy"],
)

py_test(
    name = "policy/tests/test_sample_batch",
    size = "small",
    srcs = ["policy/tests/test_sample_batch.py"],
    tags = ["team:rllib", "policy", "multi_gpu"],
)

py_test(
    name = "policy/tests/test_view_requirement",
    size = "small",
    srcs = ["policy/tests/test_view_requirement.py"],
    tags = ["team:rllib", "policy"],
)


# --------------------------------------------------------------------
# Utils:
# rllib/utils/
#
# Tag: utils
# --------------------------------------------------------------------

py_test(
    name = "test_errors",
    size = "medium",
    srcs = ["utils/tests/test_errors.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_minibatch_utils",
    size = "small",
    srcs = ["utils/tests/test_minibatch_utils.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_serialization",
    size = "small",
    srcs = ["utils/tests/test_serialization.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_curiosity",
    size = "large",
    srcs = ["utils/exploration/tests/test_curiosity.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_explorations",
    size = "large",
    srcs = ["utils/exploration/tests/test_explorations.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_value_predictions",
    size = "small",
    srcs = ["utils/postprocessing/tests/test_value_predictions.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_torch_utils",
    size = "medium",
    srcs = ["utils/tests/test_torch_utils.py"],
    tags = ["team:rllib", "utils", "gpu"],
)

# Schedules
py_test(
    name = "test_schedules",
    size = "small",
    srcs = ["utils/schedules/tests/test_schedules.py"],
    tags = ["team:rllib", "utils"],
)

# Ships everything under utils/tests/ as runtime data for this test.
py_test(
    name = "test_framework_agnostic_components",
    size = "small",
    srcs = ["utils/tests/test_framework_agnostic_components.py"],
    data = glob(["utils/tests/**"]),
    tags = ["team:rllib", "utils"],
)

# Spaces/Space utils.
py_test(
    name = "test_space_utils",
    size = "small",
    srcs = ["utils/spaces/tests/test_space_utils.py"],
    tags = ["team:rllib", "utils"],
)

# TaskPool
py_test(
    name = "test_taskpool",
    size = "small",
    srcs = ["utils/tests/test_taskpool.py"],
    tags = ["team:rllib", "utils"],
)

# ReplayBuffers
py_test(
    name = "test_episode_replay_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_episode_replay_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_multi_agent_episode_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_multi_agent_episode_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_multi_agent_mixin_replay_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_multi_agent_mixin_replay_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_multi_agent_prio_episode_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_multi_agent_prio_episode_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_multi_agent_prioritized_replay_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_multi_agent_prioritized_replay_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_multi_agent_replay_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_multi_agent_replay_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_prioritized_episode_buffer",
    # The team tag must use the exact "team:rllib" spelling (single colon)
    # shared by all sibling targets; with a doubled colon, tag-based selection
    # (e.g. bazel's --test_tag_filters) on "team:rllib" would miss this test.
    tags = ["team:rllib", "utils"],
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_prioritized_episode_buffer.py"]
)

py_test(
    name = "test_prioritized_replay_buffer_replay_buffer_api",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_prioritized_replay_buffer_replay_buffer_api.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_replay_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_replay_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_fifo_replay_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_fifo_replay_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_reservoir_buffer",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_reservoir_buffer.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_segment_tree_replay_buffer_api",
    size = "small",
    srcs = ["utils/replay_buffers/tests/test_segment_tree_replay_buffer_api.py"],
    tags = ["team:rllib", "utils"],
)

py_test(
    name = "test_check_multi_agent",
    size = "small",
    srcs = ["utils/tests/test_check_multi_agent.py"],
    tags = ["team:rllib", "utils"],
)

# Declares the pickled random-number fixture as a runtime data dependency.
py_test(
    name = "test_actor_manager",
    size = "medium",
    srcs = ["utils/tests/test_actor_manager.py"],
    data = ["utils/tests/random_numbers.pkl"],
    tags = ["team:rllib", "utils", "exclusive"],
)

# --------------------------------------------------------------------
# rllib/tests/ directory
#
# Tag: tests_dir
#
# NOTE: Add tests alphabetically into this list.
# --------------------------------------------------------------------

py_test(
    name = "tests/test_catalog",
    size = "medium",
    srcs = ["tests/test_catalog.py"],
    tags = ["team:rllib", "tests_dir"],
)

# Source lives under policy/tests/, but the target is tagged "tests_dir"; the
# APPO CartPole checkpoint directory is shipped as runtime data.
py_test(
    name = "policy/tests/test_policy_checkpoint_restore",
    size = "large",
    srcs = ["policy/tests/test_policy_checkpoint_restore.py"],
    data = glob([
        "tests/data/checkpoints/APPO_CartPole-v1-connector-enabled/**",
    ]),
    main = "policy/tests/test_policy_checkpoint_restore.py",
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_custom_resource",
    # "large" is on purpose: some frameworks take longer, even though bazel
    # may sometimes complain about the timeout being too long.
    size = "large",
    srcs = ["tests/test_custom_resource.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_dependency_tf",
    size = "small",
    srcs = ["tests/test_dependency_tf.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_dependency_torch",
    size = "small",
    srcs = ["tests/test_dependency_torch.py"],
    tags = ["team:rllib", "tests_dir"],
)

# The two eager-support targets share tests/test_eager_support.py and differ
# only in the single argument passed to it.
py_test(
    name = "tests/test_eager_support_policy_gradient",
    size = "small",
    srcs = ["tests/test_eager_support.py"],
    args = ["TestEagerSupportPolicyGradient"],
    main = "tests/test_eager_support.py",
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_eager_support_off_policy",
    size = "small",
    srcs = ["tests/test_eager_support.py"],
    args = ["TestEagerSupportOffPolicy"],
    main = "tests/test_eager_support.py",
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_filters",
    size = "small",
    srcs = ["tests/test_filters.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_gpus",
    size = "large",
    srcs = ["tests/test_gpus.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_io",
    size = "large",
    srcs = ["tests/test_io.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_local",
    size = "small",
    srcs = ["tests/test_local.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_lstm",
    size = "medium",
    srcs = ["tests/test_lstm.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_nn_framework_import_errors",
    size = "small",
    srcs = ["tests/test_nn_framework_import_errors.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_pettingzoo_env",
    size = "medium",
    srcs = ["tests/test_pettingzoo_env.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_placement_groups",
    # "large" is on purpose: some frameworks take longer, even though bazel
    # may sometimes complain about the timeout being too long.
    size = "large",
    srcs = ["tests/test_placement_groups.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_ray_client",
    size = "large",
    srcs = ["tests/test_ray_client.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_reproducibility",
    size = "medium",
    srcs = ["tests/test_reproducibility.py"],
    tags = ["team:rllib", "tests_dir"],
)

py_test(
    name = "tests/test_timesteps",
    size = "small",
    srcs = ["tests/test_timesteps.py"],
    tags = ["team:rllib", "tests_dir"],
)

# --------------------------------------------------------------------
# examples/ directory
#
# Tag: examples
#
# NOTE: Add tests alphabetically into this list.
# --------------------------------------------------------------------

# subdirectory: _docs/

# Runs the README example script as a test; tagged "documentation" and "no_main".
py_test(
    name = "examples/_docs/rllib_on_rllib_readme",
    size = "medium",
    srcs = ["examples/_docs/rllib_on_rllib_readme.py"],
    main = "examples/_docs/rllib_on_rllib_readme.py",
    tags = ["team:rllib", "documentation", "no_main"],
)

# ----------------------
# Old API stack examples
# ----------------------
# subdirectory: _old_api_stack/
# complex_struct_space.py is run once per framework flag (tf, tf2, torch).
py_test(
    name = "examples/_old_api_stack/complex_struct_space_tf",
    size = "small",
    srcs = ["examples/_old_api_stack/complex_struct_space.py"],
    args = ["--framework=tf"],
    main = "examples/_old_api_stack/complex_struct_space.py",
    tags = ["team:rllib", "exclusive", "examples", "old_api_stack"],
)

py_test(
    name = "examples/_old_api_stack/complex_struct_space_tf_eager",
    size = "small",
    srcs = ["examples/_old_api_stack/complex_struct_space.py"],
    args = ["--framework=tf2"],
    main = "examples/_old_api_stack/complex_struct_space.py",
    tags = ["team:rllib", "exclusive", "examples", "old_api_stack"],
)

py_test(
    name = "examples/_old_api_stack/complex_struct_space_torch",
    size = "small",
    srcs = ["examples/_old_api_stack/complex_struct_space.py"],
    args = ["--framework=torch"],
    main = "examples/_old_api_stack/complex_struct_space.py",
    tags = ["team:rllib", "exclusive", "examples", "old_api_stack"],
)

# subdirectory: _old_api_stack/connectors/
py_test(
    name = "examples/_old_api_stack/connectors/run_connector_policy",
    size = "small",
    srcs = ["examples/_old_api_stack/connectors/run_connector_policy.py"],
    main = "examples/_old_api_stack/connectors/run_connector_policy.py",
    tags = ["team:rllib", "exclusive", "examples", "old_api_stack"],
)

py_test(
    name = "examples/_old_api_stack/connectors/run_connector_policy_w_lstm",
    size = "small",
    srcs = ["examples/_old_api_stack/connectors/run_connector_policy.py"],
    args = ["--use-lstm"],
    main = "examples/_old_api_stack/connectors/run_connector_policy.py",
    tags = ["team:rllib", "exclusive", "examples", "old_api_stack"],
)

py_test(
    name = "examples/_old_api_stack/connectors/adapt_connector_policy",
    size = "small",
    srcs = ["examples/_old_api_stack/connectors/adapt_connector_policy.py"],
    main = "examples/_old_api_stack/connectors/adapt_connector_policy.py",
    tags = ["team:rllib", "exclusive", "examples", "old_api_stack"],
)

# py_test(
#     name = "examples/_old_api_stack/connectors/self_play_with_policy_checkpoint",
#     main = "examples/_old_api_stack/connectors/self_play_with_policy_checkpoint.py",
#     tags = ["team:rllib", "exclusive", "examples", "old_api_stack"],
#     size = "small",
#     srcs = ["examples/_old_api_stack/connectors/self_play_with_policy_checkpoint.py"],
#     args = [
#         "--train_iteration=1"  # Smoke test.
#     ]
# )

# ----------------------
# New API stack
# Note: This includes to-be-translated-to-new-API-stack examples
# tagged by @OldAPIStack and/or @HybridAPIStack
# ----------------------

# subdirectory: actions/

# Nested action spaces (flattening obs and learning w/ multi-action distribution).
# Single-agent and two-agent PPO runs of the same example script.
py_test(
    name = "examples/actions/nested_action_spaces_ppo",
    size = "large",
    srcs = ["examples/actions/nested_action_spaces.py"],
    args = ["--enable-new-api-stack", "--as-test", "--framework=torch", "--stop-reward=-500.0", "--algo=PPO"],
    main = "examples/actions/nested_action_spaces.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

py_test(
    name = "examples/actions/nested_action_spaces_multi_agent_ppo",
    size = "large",
    srcs = ["examples/actions/nested_action_spaces.py"],
    args = ["--enable-new-api-stack", "--as-test", "--num-agents=2", "--framework=torch", "--stop-reward=-1000.0", "--algo=PPO"],
    main = "examples/actions/nested_action_spaces.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: catalogs/
# ....................................
py_test(
    name = "examples/catalogs/custom_action_distribution",
    size = "small",
    srcs = ["examples/catalogs/custom_action_distribution.py"],
    main = "examples/catalogs/custom_action_distribution.py",
    tags = ["team:rllib", "examples", "no_main"],
)

py_test(
    name = "examples/catalogs/mobilenet_v2_encoder",
    size = "small",
    srcs = ["examples/catalogs/mobilenet_v2_encoder.py"],
    main = "examples/catalogs/mobilenet_v2_encoder.py",
    tags = ["team:rllib", "examples", "no_main"],
)

# subdirectory: checkpoints/
# ....................................
py_test(
    name = "examples/checkpoints/checkpoint_by_custom_criteria",
    size = "large",
    srcs = ["examples/checkpoints/checkpoint_by_custom_criteria.py"],
    args = ["--enable-new-api-stack", "--stop-reward=150.0", "--num-cpus=8"],
    main = "examples/checkpoints/checkpoint_by_custom_criteria.py",
    tags = ["team:rllib", "exclusive", "examples", "examples_use_all_core"],
)

# continue_training_from_checkpoint.py is run three times: new API stack,
# new API stack with two agents, and without the new-API-stack flag.
py_test(
    name = "examples/checkpoints/continue_training_from_checkpoint",
    size = "large",
    srcs = ["examples/checkpoints/continue_training_from_checkpoint.py"],
    args = ["--enable-new-api-stack", "--as-test"],
    main = "examples/checkpoints/continue_training_from_checkpoint.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

py_test(
    name = "examples/checkpoints/continue_training_from_checkpoint_multi_agent",
    size = "large",
    srcs = ["examples/checkpoints/continue_training_from_checkpoint.py"],
    args = ["--enable-new-api-stack", "--as-test", "--num-agents=2", "--stop-reward-crash=400.0", "--stop-reward=900.0"],
    main = "examples/checkpoints/continue_training_from_checkpoint.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
py_test(
    name = "examples/checkpoints/continue_training_from_checkpoint_old_api_stack",
    size = "large",
    srcs = ["examples/checkpoints/continue_training_from_checkpoint.py"],
    args = ["--as-test"],
    main = "examples/checkpoints/continue_training_from_checkpoint.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

py_test(
    name = "examples/checkpoints/cartpole_dqn_export",
    size = "small",
    srcs = ["examples/checkpoints/cartpole_dqn_export.py"],
    main = "examples/checkpoints/cartpole_dqn_export.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
py_test(
    name = "examples/checkpoints/onnx_tf2",
    size = "small",
    srcs = ["examples/checkpoints/onnx_tf.py"],
    args = ["--framework=tf2"],
    main = "examples/checkpoints/onnx_tf.py",
    tags = ["team:rllib", "exclusive", "examples", "no_main"],
)

#@OldAPIStack
py_test(
    name = "examples/checkpoints/onnx_torch",
    size = "small",
    srcs = ["examples/checkpoints/onnx_torch.py"],
    main = "examples/checkpoints/onnx_torch.py",
    tags = ["team:rllib", "exclusive", "examples", "no_main"],
)

#@OldAPIStack
py_test(
    name = "examples/checkpoints/onnx_torch_lstm",
    size = "small",
    srcs = ["examples/checkpoints/onnx_torch_lstm.py"],
    main = "examples/checkpoints/onnx_torch_lstm.py",
    tags = ["team:rllib", "exclusive", "examples", "no_main"],
)

# subdirectory: connectors/
# ....................................
# Framestacking examples only run in smoke-test mode (a few iters only).
# PPO
py_test(
    name = "examples/connectors/frame_stacking_ppo",
    size = "medium",
    srcs = ["examples/connectors/frame_stacking.py"],
    args = ["--enable-new-api-stack", "--stop-iter=2", "--framework=torch", "--algo=PPO"],
    main = "examples/connectors/frame_stacking.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

py_test(
    name = "examples/connectors/frame_stacking_multi_agent_ppo",
    size = "medium",
    srcs = ["examples/connectors/frame_stacking.py"],
    args = ["--enable-new-api-stack", "--num-agents=2", "--stop-iter=2", "--framework=torch", "--algo=PPO", "--num-env-runners=4", "--num-cpus=6"],
    main = "examples/connectors/frame_stacking.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# IMPALA
py_test(
    name = "examples/connectors/frame_stacking_impala",
    size = "medium",
    srcs = ["examples/connectors/frame_stacking.py"],
    args = ["--enable-new-api-stack", "--stop-iter=2", "--framework=torch", "--algo=IMPALA"],
    main = "examples/connectors/frame_stacking.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

py_test(
    name = "examples/connectors/frame_stacking_multi_agent_impala",
    size = "medium",
    srcs = ["examples/connectors/frame_stacking.py"],
    args = ["--enable-new-api-stack", "--num-agents=2", "--stop-iter=2", "--framework=torch", "--algo=IMPALA", "--num-env-runners=4", "--num-cpus=6"],
    main = "examples/connectors/frame_stacking.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# Nested observation spaces (flattening).
# PPO
py_test(
    name = "examples/connectors/flatten_observations_dict_space_ppo",
    size = "medium",
    srcs = ["examples/connectors/flatten_observations_dict_space.py"],
    args = ["--enable-new-api-stack", "--as-test", "--stop-reward=400.0", "--framework=torch", "--algo=PPO"],
    main = "examples/connectors/flatten_observations_dict_space.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

py_test(
    name = "examples/connectors/flatten_observations_dict_space_multi_agent_ppo",
    size = "medium",
    srcs = ["examples/connectors/flatten_observations_dict_space.py"],
    args = ["--enable-new-api-stack", "--num-agents=2", "--as-test", "--stop-reward=800.0", "--framework=torch", "--algo=PPO"],
    main = "examples/connectors/flatten_observations_dict_space.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# IMPALA
py_test(
    name = "examples/connectors/flatten_observations_dict_space_impala",
    size = "large",
    srcs = ["examples/connectors/flatten_observations_dict_space.py"],
    args = ["--enable-new-api-stack", "--as-test", "--stop-reward=400.0", "--stop-timesteps=2000000", "--framework=torch", "--algo=IMPALA"],
    main = "examples/connectors/flatten_observations_dict_space.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

py_test(
    name = "examples/connectors/flatten_observations_dict_space_multi_agent_impala",
    size = "large",
    srcs = ["examples/connectors/flatten_observations_dict_space.py"],
    args = ["--enable-new-api-stack", "--num-agents=2", "--as-test", "--stop-reward=800.0", "--stop-timesteps=2000000", "--framework=torch", "--algo=IMPALA"],
    main = "examples/connectors/flatten_observations_dict_space.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# Prev-r/prev actions + LSTM example.
# Runs prev_actions_prev_rewards.py with PPO on torch, 4 env runners.
py_test(
    name = "examples/connectors/prev_actions_prev_rewards_ppo",
    size = "large",
    srcs = ["examples/connectors/prev_actions_prev_rewards.py"],
    main = "examples/connectors/prev_actions_prev_rewards.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--stop-reward=200.0",
        "--framework=torch",
        "--algo=PPO",
        "--num-env-runners=4",
        "--num-cpus=6",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs prev_actions_prev_rewards.py with PPO on torch, --num-agents=2, 4 env runners.
py_test(
    name = "examples/connectors/prev_actions_prev_rewards_multi_agent_ppo",
    size = "large",
    srcs = ["examples/connectors/prev_actions_prev_rewards.py"],
    main = "examples/connectors/prev_actions_prev_rewards.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--stop-reward=400.0",
        "--framework=torch",
        "--algo=PPO",
        "--num-env-runners=4",
        "--num-cpus=6",
    ],
    tags = ["team:rllib", "exclusive", "examples", "examples_use_all_core"],
)

# MeanStd filtering example.
# PPO
# Runs mean_std_filtering.py with PPO on torch, 2 env runners.
py_test(
    name = "examples/connectors/mean_std_filtering_ppo",
    size = "medium",
    srcs = ["examples/connectors/mean_std_filtering.py"],
    main = "examples/connectors/mean_std_filtering.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--stop-reward=-300.0",
        "--framework=torch",
        "--algo=PPO",
        "--num-env-runners=2",
        "--num-cpus=4",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs mean_std_filtering.py with PPO on torch, --num-agents=2, 5 env runners.
py_test(
    name = "examples/connectors/mean_std_filtering_multi_agent_ppo",
    size = "large",
    srcs = ["examples/connectors/mean_std_filtering.py"],
    main = "examples/connectors/mean_std_filtering.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--stop-reward=-600.0",
        "--framework=torch",
        "--algo=PPO",
        "--num-env-runners=5",
        "--num-cpus=7",
    ],
    tags = ["team:rllib", "exclusive", "examples", "examples_use_all_core"],
)
# IMPALA
# TODO (sven): Make IMPALA learn Pendulum OR make this script flexible to accept
#  (lopsided obs) CartPole as well.
# py_test(
#    name = "examples/connectors/mean_std_filtering_impala",
#    main = "examples/connectors/mean_std_filtering.py",
#    tags = ["team:rllib", "exclusive", "examples"],
#    size = "medium",
#    srcs = ["examples/connectors/mean_std_filtering.py"],
#    args = ["--enable-new-api-stack", "--as-test", "--stop-reward=-300.0", "--framework=torch", "--algo=IMPALA", "--num-env-runners=2"]
# )
# py_test(
#    name = "examples/connectors/mean_std_filtering_multi_agent_impala",
#    main = "examples/connectors/mean_std_filtering.py",
#    tags = ["team:rllib", "exclusive", "examples"],
#    size = "medium",
#    srcs = ["examples/connectors/mean_std_filtering.py"],
#    args = ["--enable-new-api-stack", "--num-agents=2", "--as-test", "--stop-reward=-600.0", "--framework=torch", "--algo=IMPALA", "--num-env-runners=5", "--num-cpus=6"]
# )

# subdirectory: curiosity/
# ....................................
# Runs count_based_curiosity.py on the new API stack with --as-test.
py_test(
    name = "examples/curiosity/count_based_curiosity",
    size = "large",
    srcs = ["examples/curiosity/count_based_curiosity.py"],
    main = "examples/curiosity/count_based_curiosity.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs euclidian_distance_based_curiosity.py on the new API stack with --as-test.
py_test(
    name = "examples/curiosity/euclidian_distance_based_curiosity",
    size = "large",
    srcs = ["examples/curiosity/euclidian_distance_based_curiosity.py"],
    main = "examples/curiosity/euclidian_distance_based_curiosity.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs intrinsic_curiosity_model_based_curiosity.py with --algo=PPO.
py_test(
    name = "examples/curiosity/intrinsic_curiosity_model_based_curiosity_ppo",
    size = "large",
    srcs = ["examples/curiosity/intrinsic_curiosity_model_based_curiosity.py"],
    main = "examples/curiosity/intrinsic_curiosity_model_based_curiosity.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--algo=PPO",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# TODO (sven): Learns, but very slowly. Needs further tuning.
# py_test(
#    name = "examples/curiosity/intrinsic_curiosity_model_based_curiosity_dqn",
#    main = "examples/curiosity/intrinsic_curiosity_model_based_curiosity.py",
#    tags = ["team:rllib", "exclusive", "examples"],
#    size = "large",
#    srcs = ["examples/curiosity/intrinsic_curiosity_model_based_curiosity.py"],
#    args = ["--enable-new-api-stack", "--as-test", "--algo=DQN"]
# )


# subdirectory: curriculum/
# ....................................
# Runs curriculum_learning.py on the new API stack with --as-test.
py_test(
    name = "examples/curriculum/curriculum_learning",
    size = "medium",
    srcs = ["examples/curriculum/curriculum_learning.py"],
    main = "examples/curriculum/curriculum_learning.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: debugging/
# ....................................
#@OldAPIStack
# Runs deterministic_training.py on torch for one iteration; requests GPUs
# for both the algorithm and the env runners (tagged multi_gpu).
py_test(
    name = "examples/debugging/deterministic_training_torch",
    size = "medium",
    srcs = ["examples/debugging/deterministic_training.py"],
    main = "examples/debugging/deterministic_training.py",
    args = [
        "--as-test",
        "--stop-iters=1",
        "--framework=torch",
        "--num-gpus=1",
        "--num-gpus-per-env-runner=1",
    ],
    tags = ["team:rllib", "exclusive", "multi_gpu", "examples"],
)

# subdirectory: envs/
# ....................................
# Runs custom_gym_env.py on the new API stack with --as-test.
py_test(
    name = "examples/envs/custom_gym_env",
    size = "medium",
    srcs = ["examples/envs/custom_gym_env.py"],
    main = "examples/envs/custom_gym_env.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs custom_env_render_method.py with --num-agents=0.
py_test(
    name = "examples/envs/custom_env_render_method",
    size = "medium",
    srcs = ["examples/envs/custom_env_render_method.py"],
    main = "examples/envs/custom_env_render_method.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs custom_env_render_method.py with --num-agents=2.
py_test(
    name = "examples/envs/custom_env_render_method_multi_agent",
    size = "medium",
    srcs = ["examples/envs/custom_env_render_method.py"],
    main = "examples/envs/custom_env_render_method.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs env_rendering_and_recording.py on CartPole-v1 for 3 iterations.
# No explicit `main` is set for this target.
py_test(
    name = "examples/envs/env_rendering_and_recording",
    size = "small",
    srcs = ["examples/envs/env_rendering_and_recording.py"],
    args = [
        "--enable-new-api-stack",
        "--env=CartPole-v1",
        "--stop-iters=3",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
# Runs greyscale_env.py on torch for one iteration.
# Flags are listed one per entry, like every other target in this file,
# rather than packed into one space-separated string.
# No explicit `main` is set for this target (tagged "no_main").
py_test(
    name = "examples/envs/greyscale_env",
    size = "medium",
    srcs = ["examples/envs/greyscale_env.py"],
    args = [
        "--stop-iters=1",
        "--as-test",
        "--framework=torch",
    ],
    tags = ["team:rllib", "examples", "no_main"],
)

# subdirectory: evaluation/
# ....................................
# Runs custom_evaluation.py on torch.
py_test(
    name = "examples/evaluation/custom_evaluation",
    size = "medium",
    srcs = ["examples/evaluation/custom_evaluation.py"],
    main = "examples/evaluation/custom_evaluation.py",
    args = [
        "--enable-new-api-stack",
        "--framework=torch",
        "--as-test",
        "--stop-reward=0.75",
        "--num-cpus=5",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs custom_evaluation.py on torch with --evaluation-parallel-to-training.
py_test(
    name = "examples/evaluation/custom_evaluation_parallel_to_training",
    size = "medium",
    srcs = ["examples/evaluation/custom_evaluation.py"],
    main = "examples/evaluation/custom_evaluation.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--framework=torch",
        "--stop-reward=0.75",
        "--evaluation-parallel-to-training",
        "--num-cpus=5",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs evaluation_parallel_to_training.py with --evaluation-duration=auto.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_duration_auto_torch",
    size = "medium",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--evaluation-parallel-to-training",
        "--stop-reward=450.0",
        "--num-cpus=6",
        "--evaluation-duration=auto",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs evaluation_parallel_to_training.py with --num-agents=2,
# --evaluation-duration=auto and the duration unit set to episodes.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_multi_agent_duration_auto_torch",
    size = "large",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--evaluation-parallel-to-training",
        "--stop-reward=900.0",
        "--num-cpus=6",
        "--evaluation-duration=auto",
        "--evaluation-duration-unit=episodes",
    ],
    tags = ["team:rllib", "exclusive", "examples", "examples_use_all_core"],
)

# Runs evaluation_parallel_to_training.py with an evaluation duration of
# 511 timesteps and 3 evaluation env runners.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_511_ts_torch",
    size = "medium",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--evaluation-parallel-to-training",
        "--stop-reward=450.0",
        "--num-cpus=6",
        "--evaluation-num-env-runners=3",
        "--evaluation-duration=511",
        "--evaluation-duration-unit=timesteps",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs evaluation_parallel_to_training.py with --num-agents=2 and an
# evaluation duration of 1001 timesteps.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_multi_agent_1001_ts_torch",
    size = "medium",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--evaluation-parallel-to-training",
        "--stop-reward=900.0",
        "--num-cpus=6",
        "--evaluation-duration=1001",
        "--evaluation-duration-unit=timesteps",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs evaluation_parallel_to_training.py with an evaluation duration of
# 13 episodes.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_13_episodes_torch",
    size = "medium",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--evaluation-parallel-to-training",
        "--stop-reward=450.0",
        "--num-cpus=6",
        "--evaluation-duration=13",
        "--evaluation-duration-unit=episodes",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs evaluation_parallel_to_training.py with --num-agents=2 and an
# evaluation duration of 10 episodes.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_multi_agent_10_episodes_torch",
    size = "medium",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--evaluation-parallel-to-training",
        "--stop-reward=900.0",
        "--num-cpus=6",
        "--evaluation-duration=10",
        "--evaluation-duration-unit=episodes",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# @OldAPIStack
# Runs evaluation_parallel_to_training.py without --enable-new-api-stack,
# using --evaluation-duration=auto.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_duration_auto_torch_old_api_stack",
    size = "medium",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--as-test",
        "--evaluation-parallel-to-training",
        "--stop-reward=50.0",
        "--num-cpus=6",
        "--evaluation-duration=auto",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# @OldAPIStack
# Runs evaluation_parallel_to_training.py without --enable-new-api-stack,
# on torch, with an evaluation duration of 211 timesteps.
py_test(
    name = "examples/evaluation/evaluation_parallel_to_training_211_ts_torch_old_api_stack",
    size = "medium",
    srcs = ["examples/evaluation/evaluation_parallel_to_training.py"],
    main = "examples/evaluation/evaluation_parallel_to_training.py",
    args = [
        "--as-test",
        "--evaluation-parallel-to-training",
        "--framework=torch",
        "--stop-reward=30.0",
        "--num-cpus=6",
        "--evaluation-num-env-runners=3",
        "--evaluation-duration=211",
        "--evaluation-duration-unit=timesteps",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: fault_tolerance/
# ....................................
# Runs crashing_and_stalling_env.py with APPO (no --restart-failed-envs, no --stall).
py_test(
    name = "examples/fault_tolerance/crashing_cartpole_recreate_failed_env_runners_appo",
    size = "large",
    srcs = ["examples/fault_tolerance/crashing_and_stalling_env.py"],
    main = "examples/fault_tolerance/crashing_and_stalling_env.py",
    args = [
        "--algo=APPO",
        "--enable-new-api-stack",
        "--as-test",
        "--stop-reward=450.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)
# Runs crashing_and_stalling_env.py with APPO and --restart-failed-envs.
py_test(
    name = "examples/fault_tolerance/crashing_cartpole_restart_failed_envs_appo",
    size = "large",
    srcs = ["examples/fault_tolerance/crashing_and_stalling_env.py"],
    main = "examples/fault_tolerance/crashing_and_stalling_env.py",
    args = [
        "--algo=APPO",
        "--enable-new-api-stack",
        "--as-test",
        "--restart-failed-envs",
        "--stop-reward=450.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)
# Runs crashing_and_stalling_env.py with PPO, --restart-failed-envs and --stall.
py_test(
    name = "examples/fault_tolerance/crashing_and_stalling_cartpole_restart_failed_envs_ppo",
    size = "large",
    srcs = ["examples/fault_tolerance/crashing_and_stalling_env.py"],
    main = "examples/fault_tolerance/crashing_and_stalling_env.py",
    args = [
        "--algo=PPO",
        "--enable-new-api-stack",
        "--as-test",
        "--restart-failed-envs",
        "--stall",
        "--stop-reward=450.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)
# Runs crashing_and_stalling_env.py with PPO, --num-agents=2 and
# --restart-failed-envs.
# NOTE(review): the target name says "stalling", but `--stall` is not passed
# here — confirm whether that is intentional.
py_test(
    name = "examples/fault_tolerance/crashing_and_stalling_multi_agent_cartpole_restart_failed_envs_ppo",
    size = "large",
    srcs = ["examples/fault_tolerance/crashing_and_stalling_env.py"],
    main = "examples/fault_tolerance/crashing_and_stalling_env.py",
    args = [
        "--algo=PPO",
        "--num-agents=2",
        "--enable-new-api-stack",
        "--as-test",
        "--restart-failed-envs",
        "--stop-reward=800.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: gpus/
# ....................................
# Runs float16_training_and_inference.py (tagged "gpu").
py_test(
    name = "examples/gpus/float16_training_and_inference",
    size = "medium",
    srcs = ["examples/gpus/float16_training_and_inference.py"],
    main = "examples/gpus/float16_training_and_inference.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--stop-reward=150.0",
    ],
    tags = ["team:rllib", "exclusive", "examples", "gpu"],
)
# Runs mixed_precision_training_float16_inference.py (tagged "gpu").
py_test(
    name = "examples/gpus/mixed_precision_training_float16_inference",
    size = "medium",
    srcs = ["examples/gpus/mixed_precision_training_float16_inference.py"],
    main = "examples/gpus/mixed_precision_training_float16_inference.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "exclusive", "examples", "gpu"],
)
# Runs fractional_gpus_per_learner.py with one learner at 0.5 GPUs
# (tagged "multi_gpu").
py_test(
    name = "examples/gpus/fractional_0.5_gpus_per_learner",
    size = "medium",
    srcs = ["examples/gpus/fractional_gpus_per_learner.py"],
    main = "examples/gpus/fractional_gpus_per_learner.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--stop-reward=40.0",
        "--num-learners=1",
        "--num-gpus-per-learner=0.5",
    ],
    tags = ["team:rllib", "exclusive", "examples", "multi_gpu"],
)
# Runs fractional_gpus_per_learner.py with one learner at 0.2 GPUs
# (tagged "gpu").
py_test(
    name = "examples/gpus/fractional_0.2_gpus_per_learner",
    size = "medium",
    srcs = ["examples/gpus/fractional_gpus_per_learner.py"],
    main = "examples/gpus/fractional_gpus_per_learner.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--stop-reward=40.0",
        "--num-learners=1",
        "--num-gpus-per-learner=0.2",
    ],
    tags = ["team:rllib", "exclusive", "examples", "gpu"],
)

# subdirectory: hierarchical/
# ....................................
#@OldAPIStack
# Runs hierarchical_training.py on tf.
py_test(
    name = "examples/hierarchical/hierarchical_training_tf",
    size = "medium",
    srcs = ["examples/hierarchical/hierarchical_training.py"],
    main = "examples/hierarchical/hierarchical_training.py",
    args = [
        "--framework=tf",
        "--stop-reward=0.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
# Runs hierarchical_training.py on torch.
py_test(
    name = "examples/hierarchical/hierarchical_training_torch",
    size = "medium",
    srcs = ["examples/hierarchical/hierarchical_training.py"],
    main = "examples/hierarchical/hierarchical_training.py",
    args = [
        "--framework=torch",
        "--stop-reward=0.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: inference/
# ....................................
# Runs policy_inference_after_training.py on the new API stack.
py_test(
    name = "examples/inference/policy_inference_after_training",
    size = "medium",
    srcs = ["examples/inference/policy_inference_after_training.py"],
    main = "examples/inference/policy_inference_after_training.py",
    args = [
        "--enable-new-api-stack",
        "--stop-reward=100.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs policy_inference_after_training_w_connector.py on the new API stack.
py_test(
    name = "examples/inference/policy_inference_after_training_w_connector",
    size = "medium",
    srcs = ["examples/inference/policy_inference_after_training_w_connector.py"],
    main = "examples/inference/policy_inference_after_training_w_connector.py",
    args = [
        "--enable-new-api-stack",
        "--stop-reward=150.0",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
# Runs policy_inference_after_training_with_attention.py on tf for 2 iterations.
py_test(
    name = "examples/inference/policy_inference_after_training_with_attention_tf",
    size = "medium",
    srcs = ["examples/inference/policy_inference_after_training_with_attention.py"],
    main = "examples/inference/policy_inference_after_training_with_attention.py",
    args = [
        "--stop-iters=2",
        "--framework=tf",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
# Runs policy_inference_after_training_with_attention.py on torch for 2 iterations.
py_test(
    name = "examples/inference/policy_inference_after_training_with_attention_torch",
    size = "medium",
    srcs = ["examples/inference/policy_inference_after_training_with_attention.py"],
    main = "examples/inference/policy_inference_after_training_with_attention.py",
    args = [
        "--stop-iters=2",
        "--framework=torch",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
# Runs policy_inference_after_training_with_lstm.py on tf for 1 iteration.
py_test(
    name = "examples/inference/policy_inference_after_training_with_lstm_tf",
    size = "medium",
    srcs = ["examples/inference/policy_inference_after_training_with_lstm.py"],
    main = "examples/inference/policy_inference_after_training_with_lstm.py",
    args = [
        "--stop-iters=1",
        "--framework=tf",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

#@OldAPIStack
# Runs policy_inference_after_training_with_lstm.py on torch for 1 iteration.
py_test(
    name = "examples/inference/policy_inference_after_training_with_lstm_torch",
    size = "medium",
    srcs = ["examples/inference/policy_inference_after_training_with_lstm.py"],
    main = "examples/inference/policy_inference_after_training_with_lstm.py",
    args = [
        "--stop-iters=1",
        "--framework=torch",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: learners/
# ....................................
# Runs custom_loss_fn_simple.py on the new API stack with --as-test.
py_test(
    name = "examples/learners/custom_loss_fn_simple",
    size = "medium",
    srcs = ["examples/learners/custom_loss_fn_simple.py"],
    main = "examples/learners/custom_loss_fn_simple.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "examples"],
)

# Runs separate_vf_lr_and_optimizer.py on the new API stack with --as-test.
py_test(
    name = "examples/learners/separate_vf_lr_and_optimizer",
    size = "medium",
    srcs = ["examples/learners/separate_vf_lr_and_optimizer.py"],
    main = "examples/learners/separate_vf_lr_and_optimizer.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "examples"],
)

# Runs ppo_with_torch_lr_schedulers.py on the new API stack with --as-test.
py_test(
    name = "examples/learners/ppo_with_torch_lr_schedulers",
    size = "medium",
    srcs = ["examples/learners/ppo_with_torch_lr_schedulers.py"],
    main = "examples/learners/ppo_with_torch_lr_schedulers.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
    ],
    tags = ["team:rllib", "examples"],
)

# subdirectory: metrics/
# ....................................

# Runs custom_metrics_in_env_runners.py for 3 iterations.
py_test(
    name = "examples/metrics/custom_metrics_in_env_runners",
    size = "medium",
    srcs = ["examples/metrics/custom_metrics_in_env_runners.py"],
    main = "examples/metrics/custom_metrics_in_env_runners.py",
    args = [
        "--enable-new-api-stack",
        "--stop-iters=3",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: multi_agent/
# ....................................
# Runs custom_heuristic_policy.py on torch with --num-agents=2.
py_test(
    name = "examples/multi_agent/custom_heuristic_policy",
    size = "large",
    srcs = ["examples/multi_agent/custom_heuristic_policy.py"],
    main = "examples/multi_agent/custom_heuristic_policy.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=450.0",
    ],
    tags = ["team:rllib", "exclusive", "examples", "examples_use_all_core"],
)

# Runs different_spaces_for_agents.py with PPO on torch for 4 iterations.
py_test(
    name = "examples/multi_agent/different_spaces_for_agents_ppo",
    size = "small",
    srcs = ["examples/multi_agent/different_spaces_for_agents.py"],
    main = "examples/multi_agent/different_spaces_for_agents.py",
    args = [
        "--enable-new-api-stack",
        "--algo=PPO",
        "--stop-iters=4",
        "--framework=torch",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs multi_agent_cartpole.py on torch with --num-agents=2.
py_test(
    name = "examples/multi_agent/multi_agent_cartpole",
    size = "large",
    srcs = ["examples/multi_agent/multi_agent_cartpole.py"],
    main = "examples/multi_agent/multi_agent_cartpole.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=600.0",
        "--num-cpus=4",
    ],
    tags = ["team:rllib", "exclusive", "examples", "examples_use_all_core"],
)

# Runs multi_agent_pendulum.py on torch with --num-agents=2 and --num-gpus=2
# (tagged "multi_gpu").
py_test(
    name = "examples/multi_agent/multi_agent_pendulum_multi_gpu",
    size = "large",
    srcs = ["examples/multi_agent/multi_agent_pendulum.py"],
    main = "examples/multi_agent/multi_agent_pendulum.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=-500.0",
        "--num-cpus=5",
        "--num-gpus=2",
    ],
    tags = ["team:rllib", "exclusive", "examples", "multi_gpu"],
)

# Runs pettingzoo_independent_learning.py on torch with --num-agents=2.
py_test(
    name = "examples/multi_agent/pettingzoo_independent_learning",
    size = "large",
    srcs = ["examples/multi_agent/pettingzoo_independent_learning.py"],
    main = "examples/multi_agent/pettingzoo_independent_learning.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=-200.0",
        "--num-cpus=4",
    ],
    tags = ["team:rllib", "examples"],
)

# Runs pettingzoo_parameter_sharing.py on torch with --num-agents=2.
py_test(
    name = "examples/multi_agent/pettingzoo_parameter_sharing",
    size = "large",
    srcs = ["examples/multi_agent/pettingzoo_parameter_sharing.py"],
    main = "examples/multi_agent/pettingzoo_parameter_sharing.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=-210.0",
        "--num-cpus=4",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# TODO (sven): Activate this test once this script is ready.
# py_test(
#    name = "examples/multi_agent/pettingzoo_shared_value_function",
#    main = "examples/multi_agent/pettingzoo_shared_value_function.py",
#    tags = ["team:rllib", "exclusive", "examples"],
#    size = "large",
#    srcs = ["examples/multi_agent/pettingzoo_shared_value_function.py"],
#    args = ["--enable-new-api-stack", "--num-agents=2", "--as-test", "--framework=torch", "--stop-reward=-100.0", "--num-cpus=4"],
# )

# Runs restore_1_of_n_agents_from_checkpoint.py with PPO on torch and
# --num-agents=2. The script lives under examples/checkpoints/ even though
# this target is listed in the multi_agent/ section.
py_test(
    name = "examples/checkpoints/restore_1_of_n_agents_from_checkpoint",
    size = "large",
    srcs = ["examples/checkpoints/restore_1_of_n_agents_from_checkpoint.py"],
    main = "examples/checkpoints/restore_1_of_n_agents_from_checkpoint.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--framework=torch",
        "--checkpoint-freq=20",
        "--checkpoint-at-end",
        "--num-cpus=4",
        "--algo=PPO",
    ],
    tags = ["team:rllib", "exclusive", "examples", "examples_use_all_core", "no_main"],
)

# Runs rock_paper_scissors_heuristic_vs_learned.py on torch with --num-agents=2.
py_test(
    name = "examples/multi_agent/rock_paper_scissors_heuristic_vs_learned",
    size = "medium",
    srcs = ["examples/multi_agent/rock_paper_scissors_heuristic_vs_learned.py"],
    main = "examples/multi_agent/rock_paper_scissors_heuristic_vs_learned.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=6.5",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs rock_paper_scissors_heuristic_vs_learned.py on torch with
# --num-agents=2, --use-lstm and 4 env runners.
py_test(
    name = "examples/multi_agent/rock_paper_scissors_heuristic_vs_learned_w_lstm",
    size = "large",
    srcs = ["examples/multi_agent/rock_paper_scissors_heuristic_vs_learned.py"],
    main = "examples/multi_agent/rock_paper_scissors_heuristic_vs_learned.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=7.2",
        "--use-lstm",
        "--num-env-runners=4",
        "--num-cpus=6",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs rock_paper_scissors_learned_vs_learned.py on torch with --num-agents=2
# for 10 iterations.
# The iteration limit is spelled `--stop-iters`, matching the other targets
# in this file, instead of the shortened `--stop-iter`.
# NOTE(review): confirm the script's parser defines `--stop-iters`.
py_test(
    name = "examples/multi_agent/rock_paper_scissors_learned_vs_learned",
    size = "medium",
    srcs = ["examples/multi_agent/rock_paper_scissors_learned_vs_learned.py"],
    main = "examples/multi_agent/rock_paper_scissors_learned_vs_learned.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--framework=torch",
        "--stop-iters=10",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# @OldAPIStack
# Runs self_play_with_open_spiel.py on tf with --env=connect_four,
# without --enable-new-api-stack.
py_test(
    name = "examples/multi_agent/self_play_with_open_spiel_connect_4_ppo_tf_old_api_stack",
    size = "medium",
    srcs = ["examples/multi_agent/self_play_with_open_spiel.py"],
    main = "examples/multi_agent/self_play_with_open_spiel.py",
    args = [
        "--framework=tf",
        "--env=connect_four",
        "--win-rate-threshold=0.9",
        "--num-episodes-human-play=0",
        "--min-league-size=3",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# @OldAPIStack
# Runs self_play_with_open_spiel.py on torch with --env=connect_four,
# without --enable-new-api-stack.
py_test(
    name = "examples/multi_agent/self_play_with_open_spiel_connect_4_ppo_torch_old_api_stack",
    size = "medium",
    srcs = ["examples/multi_agent/self_play_with_open_spiel.py"],
    main = "examples/multi_agent/self_play_with_open_spiel.py",
    args = [
        "--framework=torch",
        "--env=connect_four",
        "--win-rate-threshold=0.9",
        "--num-episodes-human-play=0",
        "--min-league-size=3",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs self_play_with_open_spiel.py on torch with --env=connect_four on the
# new API stack.
py_test(
    name = "examples/multi_agent/self_play_with_open_spiel_connect_4_ppo_torch",
    size = "medium",
    srcs = ["examples/multi_agent/self_play_with_open_spiel.py"],
    main = "examples/multi_agent/self_play_with_open_spiel.py",
    args = [
        "--enable-new-api-stack",
        "--framework=torch",
        "--env=connect_four",
        "--win-rate-threshold=0.9",
        "--num-episodes-human-play=0",
        "--min-league-size=4",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs self_play_league_based_with_open_spiel.py on torch with
# --env=connect_four on the new API stack.
py_test(
    name = "examples/multi_agent/self_play_league_based_with_open_spiel_connect_4_ppo_torch",
    size = "large",
    srcs = ["examples/multi_agent/self_play_league_based_with_open_spiel.py"],
    main = "examples/multi_agent/self_play_league_based_with_open_spiel.py",
    args = [
        "--enable-new-api-stack",
        "--framework=torch",
        "--env=connect_four",
        "--win-rate-threshold=0.8",
        "--num-episodes-human-play=0",
        "--min-league-size=8",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs two_step_game_with_grouped_agents.py on torch with --num-agents=2.
py_test(
    name = "examples/multi_agent/two_step_game_with_grouped_agents",
    size = "medium",
    srcs = ["examples/multi_agent/two_step_game_with_grouped_agents.py"],
    main = "examples/multi_agent/two_step_game_with_grouped_agents.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--as-test",
        "--framework=torch",
        "--stop-reward=7.0",
    ],
    tags = ["team:rllib", "examples", "exclusive"],
)

# subdirectory: offline_rl/
# ....................................

# Runs train_w_bc_finetune_w_ppo.py on torch; ships the CartPole offline
# data as a runtime dependency.
py_test(
    name = "examples/offline_rl/train_w_bc_finetune_w_ppo",
    size = "medium",
    srcs = ["examples/offline_rl/train_w_bc_finetune_w_ppo.py"],
    main = "examples/offline_rl/train_w_bc_finetune_w_ppo.py",
    args = [
        "--enable-new-api-stack",
        "--as-test",
        "--framework=torch",
    ],
    # Offline data files needed by the script at run time.
    data = ["tests/data/cartpole/cartpole-v1_large"],
    tags = ["team:rllib", "examples", "exclusive"],
)

# @HybridAPIStack
# py_test(
#     name = "examples/offline_rl/pretrain_bc_single_agent_evaluate_as_multi_agent",
#     main = "examples/offline_rl/pretrain_bc_single_agent_evaluate_as_multi_agent.py",
#     tags = ["team:rllib", "exclusive", "examples"],
#     size = "large",
#     srcs = ["examples/offline_rl/pretrain_bc_single_agent_evaluate_as_multi_agent.py"],
#     data = ["tests/data/cartpole/large.json"],
#     args = ["--as-test"]
# )

#@OldAPIStack
# TODO (sven): Doesn't seem to learn at the moment. Uncomment once fixed.
# py_test(
#    name = "examples/offline_rl/custom_input_api_cql_torch",
#    main = "examples/offline_rl/custom_input_api.py",
#    tags = ["team:rllib", "exclusive", "examples"],
#    size = "medium",
#    srcs = ["examples/offline_rl/custom_input_api.py"],
#    args = ["--as-test", "--stop-reward=-300", "--stop-iters=1"]
# )

#@OldAPIStack
# Runs offline_rl.py for 1 iteration, without --enable-new-api-stack.
py_test(
    name = "examples/offline_rl/offline_rl_torch_old_api_stack",
    size = "medium",
    srcs = ["examples/offline_rl/offline_rl.py"],
    main = "examples/offline_rl/offline_rl.py",
    args = [
        "--as-test",
        "--stop-reward=-300",
        "--stop-iters=1",
    ],
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: ray_serve/
# ....................................
# TODO (sven): Uncomment once the path problem under Bazel is solved.
# py_test(
#    name = "examples/ray_serve/ray_serve_with_rllib",
#    main = "examples/ray_serve/ray_serve_with_rllib.py",
#    tags = ["team:rllib", "exclusive", "examples"],
#    size = "medium",
#    srcs = ["examples/ray_serve/ray_serve_with_rllib.py"],
#    args = ["--train-iters=2", "--serve-episodes=2", "--no-render"]
# )

# subdirectory: ray_tune/
# ....................................
# Runs custom_experiment.py with no extra command-line arguments.
py_test(
    name = "examples/ray_tune/custom_experiment",
    size = "medium",
    srcs = ["examples/ray_tune/custom_experiment.py"],
    main = "examples/ray_tune/custom_experiment.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs custom_logger.py with no extra command-line arguments.
py_test(
    name = "examples/ray_tune/custom_logger",
    size = "medium",
    srcs = ["examples/ray_tune/custom_logger.py"],
    main = "examples/ray_tune/custom_logger.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# Runs custom_progress_reporter.py with no extra command-line arguments.
py_test(
    name = "examples/ray_tune/custom_progress_reporter",
    size = "medium",
    srcs = ["examples/ray_tune/custom_progress_reporter.py"],
    main = "examples/ray_tune/custom_progress_reporter.py",
    tags = ["team:rllib", "exclusive", "examples"],
)

# subdirectory: rl_modules/
# ....................................
# Runs action_masking_rl_module.py for 5 iterations.
py_test(
    name = "examples/rl_modules/action_masking_rl_module",
    size = "medium",
    srcs = ["examples/rl_modules/action_masking_rl_module.py"],
    main = "examples/rl_modules/action_masking_rl_module.py",
    args = [
        "--enable-new-api-stack",
        "--stop-iters=5",
    ],
    tags = ["team:rllib", "examples"],
)

# Runs autoregressive_actions_rl_module.py on the new API stack.
py_test(
    name = "examples/rl_modules/autoregressive_actions_rl_module",
    size = "medium",
    srcs = ["examples/rl_modules/autoregressive_actions_rl_module.py"],
    main = "examples/rl_modules/autoregressive_actions_rl_module.py",
    args = [
        "--enable-new-api-stack",
    ],
    tags = ["team:rllib", "examples"],
)
# Runs custom_cnn_rl_module.py for 3 iterations.
py_test(
    name = "examples/rl_modules/custom_cnn_rl_module",
    size = "medium",
    srcs = ["examples/rl_modules/custom_cnn_rl_module.py"],
    main = "examples/rl_modules/custom_cnn_rl_module.py",
    args = [
        "--enable-new-api-stack",
        "--stop-iters=3",
    ],
    tags = ["team:rllib", "examples"],
)
# Runs custom_lstm_rl_module.py on the new API stack with --as-test.
py_test(
    name = "examples/rl_modules/custom_lstm_rl_module",
    size = "large",
    srcs = ["examples/rl_modules/custom_lstm_rl_module.py"],
    main = "examples/rl_modules/custom_lstm_rl_module.py",
    args = [
        "--as-test",
        "--enable-new-api-stack",
    ],
    tags = ["team:rllib", "examples"],
)
# Runs classes/mobilenet_rlm.py with no extra command-line arguments
# (tagged "no_main").
py_test(
    name = "examples/rl_modules/classes/mobilenet_rlm",
    size = "small",
    srcs = ["examples/rl_modules/classes/mobilenet_rlm.py"],
    main = "examples/rl_modules/classes/mobilenet_rlm.py",
    tags = ["team:rllib", "examples", "no_main"],
)

# Runs migrate_modelv2_to_new_api_stack_by_config.py with no extra
# command-line arguments.
py_test(
    name = "examples/rl_modules/migrate_modelv2_to_new_api_stack_by_config",
    size = "large",
    srcs = ["examples/rl_modules/migrate_modelv2_to_new_api_stack_by_config.py"],
    main = "examples/rl_modules/migrate_modelv2_to_new_api_stack_by_config.py",
    tags = ["team:rllib", "examples"],
)
# Runs migrate_modelv2_to_new_api_stack_by_policy_checkpoint.py with no extra
# command-line arguments.
py_test(
    name = "examples/rl_modules/migrate_modelv2_to_new_api_stack_by_policy_checkpoint",
    size = "large",
    srcs = ["examples/rl_modules/migrate_modelv2_to_new_api_stack_by_policy_checkpoint.py"],
    main = "examples/rl_modules/migrate_modelv2_to_new_api_stack_by_policy_checkpoint.py",
    tags = ["team:rllib", "examples"],
)
# Runs pretraining_single_agent_training_multi_agent.py with --num-agents=2,
# 5 pretraining iterations and 20 main iterations.
py_test(
    name = "examples/rl_modules/pretraining_single_agent_training_multi_agent",
    size = "medium",
    srcs = ["examples/rl_modules/pretraining_single_agent_training_multi_agent.py"],
    main = "examples/rl_modules/pretraining_single_agent_training_multi_agent.py",
    args = [
        "--enable-new-api-stack",
        "--num-agents=2",
        "--stop-iters-pretraining=5",
        "--stop-iters=20",
        "--stop-reward=150.0",
    ],
    tags = ["team:rllib", "examples"],
)

# Example test: examples/autoregressive_action_dist.py with `--framework=tf`.
# Shares its script with the `_torch` target; only the framework flag differs.
#@OldAPIStack
py_test(
    name = "examples/autoregressive_action_dist_tf",
    size = "medium",
    srcs = ["examples/autoregressive_action_dist.py"],
    args = [
        "--as-test",
        "--framework=tf",
        "--stop-reward=-0.012",
        "--num-cpus=4",
    ],
    main = "examples/autoregressive_action_dist.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/autoregressive_action_dist.py with `--framework=torch`.
# Shares its script with the `_tf` target; only the framework flag differs.
#@OldAPIStack
py_test(
    name = "examples/autoregressive_action_dist_torch",
    size = "medium",
    srcs = ["examples/autoregressive_action_dist.py"],
    args = [
        "--as-test",
        "--framework=torch",
        "--stop-reward=-0.012",
        "--num-cpus=4",
    ],
    main = "examples/autoregressive_action_dist.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/centralized_critic.py with `--framework=tf` and
# `--stop-reward=7.2`.
#@OldAPIStack
py_test(
    name = "examples/centralized_critic_tf",
    size = "medium",
    srcs = ["examples/centralized_critic.py"],
    args = [
        "--as-test",
        "--framework=tf",
        "--stop-reward=7.2",
    ],
    main = "examples/centralized_critic.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/centralized_critic.py with `--framework=torch` and
# `--stop-reward=7.2`.
#@OldAPIStack
py_test(
    name = "examples/centralized_critic_torch",
    size = "medium",
    srcs = ["examples/centralized_critic.py"],
    args = [
        "--as-test",
        "--framework=torch",
        "--stop-reward=7.2",
    ],
    main = "examples/centralized_critic.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/centralized_critic_2.py with `--framework=tf` and
# `--stop-reward=6.0`.
#@OldAPIStack
py_test(
    name = "examples/centralized_critic_2_tf",
    size = "medium",
    srcs = ["examples/centralized_critic_2.py"],
    args = [
        "--as-test",
        "--framework=tf",
        "--stop-reward=6.0",
    ],
    main = "examples/centralized_critic_2.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/centralized_critic_2.py with `--framework=torch` and
# `--stop-reward=6.0`.
#@OldAPIStack
py_test(
    name = "examples/centralized_critic_2_torch",
    size = "medium",
    srcs = ["examples/centralized_critic_2.py"],
    args = [
        "--as-test",
        "--framework=torch",
        "--stop-reward=6.0",
    ],
    main = "examples/centralized_critic_2.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/custom_recurrent_rnn_tokenizer.py on
# `--env=RepeatAfterMeEnv` with `--framework=tf2`.
py_test(
    name = "examples/custom_recurrent_rnn_tokenizer_repeat_after_me_tf2",
    size = "medium",
    srcs = ["examples/custom_recurrent_rnn_tokenizer.py"],
    args = [
        "--as-test",
        "--framework=tf2",
        "--stop-reward=40",
        "--env=RepeatAfterMeEnv",
        "--num-cpus=4",
    ],
    main = "examples/custom_recurrent_rnn_tokenizer.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/custom_recurrent_rnn_tokenizer.py on
# `--env=RepeatInitialObsEnv` with `--framework=tf2`.
# NOTE(review): the other three custom_recurrent_rnn_tokenizer targets carry
# the "exclusive" tag and this one does not, although it also passes
# `--num-cpus=4` -- confirm the omission is intentional.
py_test(
    name = "examples/custom_recurrent_rnn_tokenizer_repeat_initial_obs_env_tf2",
    size = "medium",
    srcs = ["examples/custom_recurrent_rnn_tokenizer.py"],
    args = [
        "--as-test",
        "--framework=tf2",
        "--stop-reward=10",
        "--stop-timesteps=300000",
        "--env=RepeatInitialObsEnv",
        "--num-cpus=4",
    ],
    main = "examples/custom_recurrent_rnn_tokenizer.py",
    tags = [
        "team:rllib",
        "examples",
    ],
)

# Example test: examples/custom_recurrent_rnn_tokenizer.py on
# `--env=RepeatAfterMeEnv` with `--framework=torch`.
py_test(
    name = "examples/custom_recurrent_rnn_tokenizer_repeat_after_me_torch",
    size = "medium",
    srcs = ["examples/custom_recurrent_rnn_tokenizer.py"],
    args = [
        "--as-test",
        "--framework=torch",
        "--stop-reward=40",
        "--env=RepeatAfterMeEnv",
        "--num-cpus=4",
    ],
    main = "examples/custom_recurrent_rnn_tokenizer.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: examples/custom_recurrent_rnn_tokenizer.py on
# `--env=RepeatInitialObsEnv` with `--framework=torch`.
py_test(
    name = "examples/custom_recurrent_rnn_tokenizer_repeat_initial_obs_env_torch",
    size = "medium",
    srcs = ["examples/custom_recurrent_rnn_tokenizer.py"],
    args = [
        "--as-test",
        "--framework=torch",
        "--stop-reward=10",
        "--stop-timesteps=300000",
        "--env=RepeatInitialObsEnv",
        "--num-cpus=4",
    ],
    main = "examples/custom_recurrent_rnn_tokenizer.py",
    tags = [
        "team:rllib",
        "exclusive",
        "examples",
    ],
)

# Example test: runs examples/replay_buffer_api.py with its default arguments
# (size: large).
py_test(
    name = "examples/replay_buffer_api",
    size = "large",
    srcs = ["examples/replay_buffer_api.py"],
    # Spelled out explicitly, like the other example targets in this file,
    # instead of relying on the implicit `<name>.py` lookup in `srcs`.
    main = "examples/replay_buffer_api.py",
    tags = [
        "team:rllib",
        "examples",
    ],
)


# --------------------------------------------------------------------
# Manual/disabled tests
# --------------------------------------------------------------------
# Registers utils/tests/test_utils.py through the py_test_module_list macro.
# The "manual" tag keeps the resulting target(s) out of wildcard target
# patterns, so they only run when requested explicitly.
py_test_module_list(
    size = "large",
    extra_srcs = [],
    files = [
        "utils/tests/test_utils.py",
    ],
    tags = [
        "manual",
        "team:rllib",
        "no_main",
    ],
    deps = [],
)