;; Automatically produced by rddl.translate.RDDL2Format

;; Automatically produced by rddl.translate.RDDL2Format
(define (domain skill_teaching_mdp)
(:requirements :adl :probabilistic-effects :rewards)
;; State propositions of the domain. Every proposition is zero-arity and
;; appears in two copies distinguished by the suffixes __s0 and __s1
;; (presumably one copy per skill object of the original RDDL instance --
;; TODO confirm against the RDDL source).
(:predicates
(hintedRight__s0)
(hintedRight__s1)
(proficiencyHigh__s0)
(proficiencyHigh__s1)
(updateTurn__s0)
(updateTurn__s1)
(answeredRight__s0)
(answeredRight__s1)
(proficiencyMed__s0)
(proficiencyMed__s1)
(hintDelayVar__s0)
(hintDelayVar__s1)
)
;; askProb__s0 has no precondition; its whole behaviour is the conjunction of
;; conditional effects below. Per PPDDL semantics the `when` conditions are
;; evaluated in the state the action is applied to, and a `probabilistic`
;; effect whose listed probabilities sum to less than 1 leaves the state
;; unchanged with the remaining probability.
(:action askProb__s0
:effect (and
; hintedRight: cleared for both s0 and s1.
(probabilistic 1.0 (not (hintedRight__s0)))
(probabilistic 1.0 (not (hintedRight__s1)))
; proficiencyHigh__s0:
;   set   - on updateTurn__s0 when answeredRight__s0 and proficiencyMed__s0 hold and it is not yet high;
;   lost  - with probability ~0.0435 when updateTurn__s1 holds and updateTurn__s0 does not;
;   lost  - on updateTurn__s0 when neither answeredRight__s0 nor hintDelayVar__s0 holds.
(when (and (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0) (proficiencyMed__s0)) (probabilistic 1.0 (proficiencyHigh__s0) ))
(when (and (proficiencyHigh__s0) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 0.04352919459342952 (not (proficiencyHigh__s0))))
(when (and (proficiencyHigh__s0) (updateTurn__s0) (not (answeredRight__s0)) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyHigh__s0))))
; proficiencyHigh__s1:
;   set   - on updateTurn__s1 when answeredRight__s1 and proficiencyMed__s1 hold and it is not yet high;
;   lost  - on updateTurn__s1 when neither answeredRight__s1 nor hintDelayVar__s1 holds
;           (two rules, one per value of updateTurn__s0);
;   lost  - with probability ~0.0188 when updateTurn__s0 holds and updateTurn__s1 does not.
(when (and (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1) (proficiencyMed__s1)) (probabilistic 1.0 (proficiencyHigh__s1) ))
(when (and (proficiencyHigh__s1) (not (updateTurn__s0)) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (not (updateTurn__s1))) (probabilistic 0.018769168853759788 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
; updateTurn: updateTurn__s0 is set when neither turn flag holds and cleared
; when it already holds; updateTurn__s1 is always cleared.
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (updateTurn__s0) ))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (updateTurn__s0))))
(probabilistic 1.0 (not (updateTurn__s1)))
; answeredRight__s0: when neither turn flag holds it becomes true with a
; probability that depends on the proficiency flags of s0
; (~0.570 neither high nor med, ~0.718 med but not high, ~0.907 high) and false
; otherwise; whenever a turn flag holds it is cleared.
(when (and (not (proficiencyHigh__s0)) (not (updateTurn__s0)) (not (updateTurn__s1)) (not (proficiencyMed__s0))) (probabilistic 0.56987906 (answeredRight__s0) 0.43012094 (not (answeredRight__s0))))
(when (and (not (proficiencyHigh__s0)) (not (updateTurn__s0)) (not (updateTurn__s1)) (proficiencyMed__s0)) (probabilistic 0.71801746 (answeredRight__s0) 0.28198254 (not (answeredRight__s0))))
(when (and (not (proficiencyHigh__s0)) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (answeredRight__s0))))
(when (and (not (proficiencyHigh__s0)) (updateTurn__s0)) (probabilistic 1.0 (not (answeredRight__s0))))
(when (and (proficiencyHigh__s0) (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 0.9066789 (answeredRight__s0) 0.09332110000000005 (not (answeredRight__s0))))
(when (and (proficiencyHigh__s0) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (answeredRight__s0))))
(when (and (proficiencyHigh__s0) (updateTurn__s0)) (probabilistic 1.0 (not (answeredRight__s0))))
; answeredRight__s1: always cleared by this action.
(probabilistic 1.0 (not (answeredRight__s1)))
; proficiencyMed__s0:
;   cleared - on updateTurn__s0 when med holds but high, hintedRight__s0,
;             answeredRight__s0 and hintDelayVar__s0 are all false;
;   set     - on updateTurn__s0 (not high) when answeredRight__s0 or hintedRight__s0 holds;
;   set     - whenever proficiencyHigh__s0 holds (one rule per value of hintedRight__s0).
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (not (answeredRight__s0)) (proficiencyMed__s0) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyMed__s0))))
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (not (hintedRight__s0)) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (not (proficiencyHigh__s0)) (updateTurn__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
; proficiencyMed__s1: same rule set as above, applied to the __s1 propositions.
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (not (answeredRight__s1)) (proficiencyMed__s1) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyMed__s1))))
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (not (hintedRight__s1)) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (not (proficiencyHigh__s1)) (updateTurn__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
; hintDelayVar: cleared for both s0 and s1.
(probabilistic 1.0 (not (hintDelayVar__s0)))
(probabilistic 1.0 (not (hintDelayVar__s1)))
; Reward: increased by 1.1778302 / 1.2346091 when proficiencyHigh__s0 / __s1
; holds, decreased by the same amounts when proficiencyMed__s0 / __s1 is false.
(when (proficiencyHigh__s0) (increase (reward) 1.1778302))
(when (proficiencyHigh__s1) (increase (reward) 1.2346091))
(when (not (proficiencyMed__s0)) (decrease (reward) 1.1778302))
(when (not (proficiencyMed__s1)) (decrease (reward) 1.2346091))
)
)
;; askProb__s1 has no precondition; its whole behaviour is the conjunction of
;; conditional effects below. Per PPDDL semantics the `when` conditions are
;; evaluated in the state the action is applied to, and a `probabilistic`
;; effect whose listed probabilities sum to less than 1 leaves the state
;; unchanged with the remaining probability.
(:action askProb__s1
:effect (and
; hintedRight: cleared for both s0 and s1.
(probabilistic 1.0 (not (hintedRight__s0)))
(probabilistic 1.0 (not (hintedRight__s1)))
; proficiencyHigh__s0:
;   set   - on updateTurn__s0 when answeredRight__s0 and proficiencyMed__s0 hold and it is not yet high;
;   lost  - with probability ~0.0435 when updateTurn__s1 holds and updateTurn__s0 does not;
;   lost  - on updateTurn__s0 when neither answeredRight__s0 nor hintDelayVar__s0 holds.
(when (and (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0) (proficiencyMed__s0)) (probabilistic 1.0 (proficiencyHigh__s0) ))
(when (and (proficiencyHigh__s0) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 0.04352919459342952 (not (proficiencyHigh__s0))))
(when (and (proficiencyHigh__s0) (updateTurn__s0) (not (answeredRight__s0)) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyHigh__s0))))
; proficiencyHigh__s1:
;   set   - on updateTurn__s1 when answeredRight__s1 and proficiencyMed__s1 hold and it is not yet high;
;   lost  - on updateTurn__s1 when neither answeredRight__s1 nor hintDelayVar__s1 holds
;           (two rules, one per value of updateTurn__s0);
;   lost  - with probability ~0.0188 when updateTurn__s0 holds and updateTurn__s1 does not.
(when (and (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1) (proficiencyMed__s1)) (probabilistic 1.0 (proficiencyHigh__s1) ))
(when (and (proficiencyHigh__s1) (not (updateTurn__s0)) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (not (updateTurn__s1))) (probabilistic 0.018769168853759788 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
; updateTurn: updateTurn__s0 is always cleared; updateTurn__s1 is set when
; neither turn flag holds and cleared in every other case.
(probabilistic 1.0 (not (updateTurn__s0)))
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (updateTurn__s1) ))
(when (and (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (updateTurn__s1))))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (updateTurn__s1))))
; answeredRight__s0: always cleared by this action.
(probabilistic 1.0 (not (answeredRight__s0)))
; answeredRight__s1: when neither turn flag holds it becomes true with a
; probability that depends on the proficiency flags of s1
; (~0.741 neither high nor med, ~0.790 med but not high, ~0.954 high) and false
; otherwise; whenever a turn flag holds it is cleared.
(when (and (not (proficiencyHigh__s1)) (not (updateTurn__s0)) (not (updateTurn__s1)) (not (proficiencyMed__s1))) (probabilistic 0.7414986 (answeredRight__s1) 0.2585014 (not (answeredRight__s1))))
(when (and (not (proficiencyHigh__s1)) (not (updateTurn__s0)) (not (updateTurn__s1)) (proficiencyMed__s1)) (probabilistic 0.7900833 (answeredRight__s1) 0.20991669999999996 (not (answeredRight__s1))))
(when (and (not (proficiencyHigh__s1)) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (answeredRight__s1))))
(when (and (not (proficiencyHigh__s1)) (updateTurn__s0)) (probabilistic 1.0 (not (answeredRight__s1))))
(when (and (proficiencyHigh__s1) (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 0.9543038 (answeredRight__s1) 0.045696199999999965 (not (answeredRight__s1))))
(when (and (proficiencyHigh__s1) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (answeredRight__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0)) (probabilistic 1.0 (not (answeredRight__s1))))
; proficiencyMed__s0:
;   cleared - on updateTurn__s0 when med holds but high, hintedRight__s0,
;             answeredRight__s0 and hintDelayVar__s0 are all false;
;   set     - on updateTurn__s0 (not high) when answeredRight__s0 or hintedRight__s0 holds;
;   set     - whenever proficiencyHigh__s0 holds (one rule per value of hintedRight__s0).
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (not (answeredRight__s0)) (proficiencyMed__s0) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyMed__s0))))
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (not (hintedRight__s0)) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (not (proficiencyHigh__s0)) (updateTurn__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
; proficiencyMed__s1: same rule set as above, applied to the __s1 propositions.
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (not (answeredRight__s1)) (proficiencyMed__s1) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyMed__s1))))
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (not (hintedRight__s1)) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (not (proficiencyHigh__s1)) (updateTurn__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
; hintDelayVar: cleared for both s0 and s1.
(probabilistic 1.0 (not (hintDelayVar__s0)))
(probabilistic 1.0 (not (hintDelayVar__s1)))
; Reward: increased by 1.1778302 / 1.2346091 when proficiencyHigh__s0 / __s1
; holds, decreased by the same amounts when proficiencyMed__s0 / __s1 is false.
(when (proficiencyHigh__s0) (increase (reward) 1.1778302))
(when (proficiencyHigh__s1) (increase (reward) 1.2346091))
(when (not (proficiencyMed__s0)) (decrease (reward) 1.1778302))
(when (not (proficiencyMed__s1)) (decrease (reward) 1.2346091))
)
)
;; giveHint__s0 has no precondition; its whole behaviour is the conjunction of
;; conditional effects below. Per PPDDL semantics the `when` conditions are
;; evaluated in the state the action is applied to, and a `probabilistic`
;; effect whose listed probabilities sum to less than 1 leaves the state
;; unchanged with the remaining probability.
(:action giveHint__s0
:effect (and
; hintedRight: hintedRight__s0 is set when neither turn flag holds and
; cleared otherwise; hintedRight__s1 is always cleared.
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (hintedRight__s0) ))
(when (and (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (hintedRight__s0))))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (hintedRight__s0))))
(probabilistic 1.0 (not (hintedRight__s1)))
; proficiencyHigh__s0:
;   set   - on updateTurn__s0 when answeredRight__s0 and proficiencyMed__s0 hold and it is not yet high;
;   lost  - with probability ~0.0435 when updateTurn__s1 holds and updateTurn__s0 does not;
;   lost  - on updateTurn__s0 when neither answeredRight__s0 nor hintDelayVar__s0 holds.
(when (and (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0) (proficiencyMed__s0)) (probabilistic 1.0 (proficiencyHigh__s0) ))
(when (and (proficiencyHigh__s0) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 0.04352919459342952 (not (proficiencyHigh__s0))))
(when (and (proficiencyHigh__s0) (updateTurn__s0) (not (answeredRight__s0)) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyHigh__s0))))
; proficiencyHigh__s1:
;   set   - on updateTurn__s1 when answeredRight__s1 and proficiencyMed__s1 hold and it is not yet high;
;   lost  - on updateTurn__s1 when neither answeredRight__s1 nor hintDelayVar__s1 holds
;           (two rules, one per value of updateTurn__s0);
;   lost  - with probability ~0.0188 when updateTurn__s0 holds and updateTurn__s1 does not.
(when (and (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1) (proficiencyMed__s1)) (probabilistic 1.0 (proficiencyHigh__s1) ))
(when (and (proficiencyHigh__s1) (not (updateTurn__s0)) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (not (updateTurn__s1))) (probabilistic 0.018769168853759788 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
; updateTurn: updateTurn__s0 is set when neither turn flag holds and cleared
; when it already holds; updateTurn__s1 is always cleared.
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (updateTurn__s0) ))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (updateTurn__s0))))
(probabilistic 1.0 (not (updateTurn__s1)))
; answeredRight: cleared for both s0 and s1.
(probabilistic 1.0 (not (answeredRight__s0)))
(probabilistic 1.0 (not (answeredRight__s1)))
; proficiencyMed__s0:
;   cleared - on updateTurn__s0 when med holds but high, hintedRight__s0,
;             answeredRight__s0 and hintDelayVar__s0 are all false;
;   set     - on updateTurn__s0 (not high) when answeredRight__s0 or hintedRight__s0 holds;
;   set     - whenever proficiencyHigh__s0 holds (one rule per value of hintedRight__s0).
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (not (answeredRight__s0)) (proficiencyMed__s0) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyMed__s0))))
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (not (hintedRight__s0)) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (not (proficiencyHigh__s0)) (updateTurn__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
; proficiencyMed__s1: same rule set as above, applied to the __s1 propositions.
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (not (answeredRight__s1)) (proficiencyMed__s1) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyMed__s1))))
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (not (hintedRight__s1)) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (not (proficiencyHigh__s1)) (updateTurn__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
; hintDelayVar: hintDelayVar__s0 is set when neither turn flag holds and
; cleared otherwise; hintDelayVar__s1 is always cleared.
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (hintDelayVar__s0) ))
(when (and (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (hintDelayVar__s0))))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (hintDelayVar__s0))))
(probabilistic 1.0 (not (hintDelayVar__s1)))
; Reward: increased by 1.1778302 / 1.2346091 when proficiencyHigh__s0 / __s1
; holds, decreased by the same amounts when proficiencyMed__s0 / __s1 is false.
(when (proficiencyHigh__s0) (increase (reward) 1.1778302))
(when (proficiencyHigh__s1) (increase (reward) 1.2346091))
(when (not (proficiencyMed__s0)) (decrease (reward) 1.1778302))
(when (not (proficiencyMed__s1)) (decrease (reward) 1.2346091))
)
)
;; giveHint__s1 has no precondition; its whole behaviour is the conjunction of
;; conditional effects below. Per PPDDL semantics the `when` conditions are
;; evaluated in the state the action is applied to, and a `probabilistic`
;; effect whose listed probabilities sum to less than 1 leaves the state
;; unchanged with the remaining probability.
(:action giveHint__s1
:effect (and
; hintedRight: hintedRight__s0 is always cleared; hintedRight__s1 is set
; when neither turn flag holds and cleared otherwise.
(probabilistic 1.0 (not (hintedRight__s0)))
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (hintedRight__s1) ))
(when (and (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (hintedRight__s1))))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (hintedRight__s1))))
; proficiencyHigh__s0:
;   set   - on updateTurn__s0 when answeredRight__s0 and proficiencyMed__s0 hold and it is not yet high;
;   lost  - with probability ~0.0435 when updateTurn__s1 holds and updateTurn__s0 does not;
;   lost  - on updateTurn__s0 when neither answeredRight__s0 nor hintDelayVar__s0 holds.
(when (and (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0) (proficiencyMed__s0)) (probabilistic 1.0 (proficiencyHigh__s0) ))
(when (and (proficiencyHigh__s0) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 0.04352919459342952 (not (proficiencyHigh__s0))))
(when (and (proficiencyHigh__s0) (updateTurn__s0) (not (answeredRight__s0)) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyHigh__s0))))
; proficiencyHigh__s1:
;   set   - on updateTurn__s1 when answeredRight__s1 and proficiencyMed__s1 hold and it is not yet high;
;   lost  - on updateTurn__s1 when neither answeredRight__s1 nor hintDelayVar__s1 holds
;           (two rules, one per value of updateTurn__s0);
;   lost  - with probability ~0.0188 when updateTurn__s0 holds and updateTurn__s1 does not.
(when (and (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1) (proficiencyMed__s1)) (probabilistic 1.0 (proficiencyHigh__s1) ))
(when (and (proficiencyHigh__s1) (not (updateTurn__s0)) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (not (updateTurn__s1))) (probabilistic 0.018769168853759788 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
; updateTurn: updateTurn__s0 is always cleared; updateTurn__s1 is set when
; neither turn flag holds and cleared in every other case.
(probabilistic 1.0 (not (updateTurn__s0)))
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (updateTurn__s1) ))
(when (and (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (updateTurn__s1))))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (updateTurn__s1))))
; answeredRight: cleared for both s0 and s1.
(probabilistic 1.0 (not (answeredRight__s0)))
(probabilistic 1.0 (not (answeredRight__s1)))
; proficiencyMed__s0:
;   cleared - on updateTurn__s0 when med holds but high, hintedRight__s0,
;             answeredRight__s0 and hintDelayVar__s0 are all false;
;   set     - on updateTurn__s0 (not high) when answeredRight__s0 or hintedRight__s0 holds;
;   set     - whenever proficiencyHigh__s0 holds (one rule per value of hintedRight__s0).
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (not (answeredRight__s0)) (proficiencyMed__s0) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyMed__s0))))
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (not (hintedRight__s0)) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (not (proficiencyHigh__s0)) (updateTurn__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
; proficiencyMed__s1: same rule set as above, applied to the __s1 propositions.
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (not (answeredRight__s1)) (proficiencyMed__s1) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyMed__s1))))
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (not (hintedRight__s1)) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (not (proficiencyHigh__s1)) (updateTurn__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
; hintDelayVar: hintDelayVar__s0 is always cleared; hintDelayVar__s1 is set
; when neither turn flag holds and cleared otherwise.
(probabilistic 1.0 (not (hintDelayVar__s0)))
(when (and (not (updateTurn__s0)) (not (updateTurn__s1))) (probabilistic 1.0 (hintDelayVar__s1) ))
(when (and (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 1.0 (not (hintDelayVar__s1))))
(when (and (updateTurn__s0)) (probabilistic 1.0 (not (hintDelayVar__s1))))
; Reward: increased by 1.1778302 / 1.2346091 when proficiencyHigh__s0 / __s1
; holds, decreased by the same amounts when proficiencyMed__s0 / __s1 is false.
(when (proficiencyHigh__s0) (increase (reward) 1.1778302))
(when (proficiencyHigh__s1) (increase (reward) 1.2346091))
(when (not (proficiencyMed__s0)) (decrease (reward) 1.1778302))
(when (not (proficiencyMed__s1)) (decrease (reward) 1.2346091))
)
)
;; noop has no precondition. It is not a pure no-op on the state: it clears
;; the hint, turn, answer and hint-delay propositions and still applies the
;; proficiency update rules and the reward terms below. Per PPDDL semantics
;; the `when` conditions are evaluated in the state the action is applied to,
;; and a `probabilistic` effect whose listed probabilities sum to less than 1
;; leaves the state unchanged with the remaining probability.
(:action noop
:effect (and
; hintedRight: cleared for both s0 and s1.
(probabilistic 1.0 (not (hintedRight__s0)))
(probabilistic 1.0 (not (hintedRight__s1)))
; proficiencyHigh__s0:
;   set   - on updateTurn__s0 when answeredRight__s0 and proficiencyMed__s0 hold and it is not yet high;
;   lost  - with probability ~0.0435 when updateTurn__s1 holds and updateTurn__s0 does not;
;   lost  - on updateTurn__s0 when neither answeredRight__s0 nor hintDelayVar__s0 holds.
(when (and (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0) (proficiencyMed__s0)) (probabilistic 1.0 (proficiencyHigh__s0) ))
(when (and (proficiencyHigh__s0) (not (updateTurn__s0)) (updateTurn__s1)) (probabilistic 0.04352919459342952 (not (proficiencyHigh__s0))))
(when (and (proficiencyHigh__s0) (updateTurn__s0) (not (answeredRight__s0)) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyHigh__s0))))
; proficiencyHigh__s1:
;   set   - on updateTurn__s1 when answeredRight__s1 and proficiencyMed__s1 hold and it is not yet high;
;   lost  - on updateTurn__s1 when neither answeredRight__s1 nor hintDelayVar__s1 holds
;           (two rules, one per value of updateTurn__s0);
;   lost  - with probability ~0.0188 when updateTurn__s0 holds and updateTurn__s1 does not.
(when (and (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1) (proficiencyMed__s1)) (probabilistic 1.0 (proficiencyHigh__s1) ))
(when (and (proficiencyHigh__s1) (not (updateTurn__s0)) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (not (updateTurn__s1))) (probabilistic 0.018769168853759788 (not (proficiencyHigh__s1))))
(when (and (proficiencyHigh__s1) (updateTurn__s0) (updateTurn__s1) (not (answeredRight__s1)) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyHigh__s1))))
; updateTurn and answeredRight: cleared for both s0 and s1.
(probabilistic 1.0 (not (updateTurn__s0)))
(probabilistic 1.0 (not (updateTurn__s1)))
(probabilistic 1.0 (not (answeredRight__s0)))
(probabilistic 1.0 (not (answeredRight__s1)))
; proficiencyMed__s0:
;   cleared - on updateTurn__s0 when med holds but high, hintedRight__s0,
;             answeredRight__s0 and hintDelayVar__s0 are all false;
;   set     - on updateTurn__s0 (not high) when answeredRight__s0 or hintedRight__s0 holds;
;   set     - whenever proficiencyHigh__s0 holds (one rule per value of hintedRight__s0).
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (not (answeredRight__s0)) (proficiencyMed__s0) (not (hintDelayVar__s0))) (probabilistic 1.0 (not (proficiencyMed__s0))))
(when (and (not (hintedRight__s0)) (not (proficiencyHigh__s0)) (updateTurn__s0) (answeredRight__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (not (hintedRight__s0)) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (not (proficiencyHigh__s0)) (updateTurn__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
(when (and (hintedRight__s0) (proficiencyHigh__s0)) (probabilistic 1.0 (proficiencyMed__s0) ))
; proficiencyMed__s1: same rule set as above, applied to the __s1 propositions.
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (not (answeredRight__s1)) (proficiencyMed__s1) (not (hintDelayVar__s1))) (probabilistic 1.0 (not (proficiencyMed__s1))))
(when (and (not (hintedRight__s1)) (not (proficiencyHigh__s1)) (updateTurn__s1) (answeredRight__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (not (hintedRight__s1)) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (not (proficiencyHigh__s1)) (updateTurn__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
(when (and (hintedRight__s1) (proficiencyHigh__s1)) (probabilistic 1.0 (proficiencyMed__s1) ))
; hintDelayVar: cleared for both s0 and s1.
(probabilistic 1.0 (not (hintDelayVar__s0)))
(probabilistic 1.0 (not (hintDelayVar__s1)))
; Reward: increased by 1.1778302 / 1.2346091 when proficiencyHigh__s0 / __s1
; holds, decreased by the same amounts when proficiencyMed__s0 / __s1 is false.
(when (proficiencyHigh__s0) (increase (reward) 1.1778302))
(when (proficiencyHigh__s1) (increase (reward) 1.2346091))
(when (not (proficiencyMed__s0)) (decrease (reward) 1.1778302))
(when (not (proficiencyMed__s1)) (decrease (reward) 1.2346091))
)
)
)
;; Problem instance skill_teaching_inst_mdp__1 for the skill_teaching_mdp
;; domain. The objective is to maximize the accumulated (reward) fluent.
(define (problem skill_teaching_inst_mdp__1)
(:domain skill_teaching_mdp)
;; :init lists no propositions; under the usual closed-world reading every
;; predicate is therefore false in the initial state.
(:init
)
(:metric maximize (reward))
;; The horizon and discount below are emitted as comments only, so they are
;; not part of the parsed problem; a planner has to be given these values
;; separately if it needs them.
;; (:horizon 40)
;; (:discount 1.0)
)

;; Related Posts