diff --git a/doc/smart-switch/pmon/images/dpu-reboot-seq.svg b/doc/smart-switch/pmon/images/dpu-reboot-seq.svg
new file mode 100644
index 0000000000..8182562f92
--- /dev/null
+++ b/doc/smart-switch/pmon/images/dpu-reboot-seq.svg
@@ -0,0 +1 @@
+<svg aria-roledescription="sequence" role="graphics-document document" viewBox="-50 -10 1717.5 946" style="max-width: 1717.5px;" xmlns="http://www.w3.org/2000/svg" width="100%" id="export-svg"><style xmlns="http://www.w3.org/1999/xhtml">@import url("https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.2.0/css/all.min.css"); p {margin: 0;}</style><g><rect class="actor actor-bottom" ry="3" rx="3" name="platform" height="65" width="161" stroke="#666" fill="#eaeaea" y="860" x="1456.5"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="892.5" x="1537"><tspan dy="0" x="1537">NPU: Platform code</tspan></text></g><g><rect class="actor actor-bottom" ry="3" rx="3" name="platform-api" height="65" width="150" stroke="#666" fill="#eaeaea" y="860" x="1222"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="892.5" x="1297"><tspan dy="0" x="1297">NPU: platform API</tspan></text></g><g><rect class="actor actor-bottom" ry="3" rx="3" name="chassisd" height="65" width="150" stroke="#666" fill="#eaeaea" y="860" x="1022"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="892.5" x="1097"><tspan dy="0" x="1097">NPU: chassisd</tspan></text></g><g><rect class="actor actor-bottom" ry="3" rx="3" name="chassis-state-db" height="65" width="176" stroke="#666" fill="#eaeaea" y="860" x="759"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="892.5" x="847"><tspan dy="0" x="847">NPU: chassisStateDB</tspan></text></g><g><rect class="actor actor-bottom" ry="3" rx="3" name="state-db" height="65" width="150" stroke="#666" fill="#eaeaea" y="860" x="559"/><text class="actor actor-box" 
alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="892.5" x="634"><tspan dy="0" x="634">NPU: stateDB</tspan></text></g><g><rect class="actor actor-bottom" ry="3" rx="3" name="host-service" height="65" width="150" stroke="#666" fill="#eaeaea" y="860" x="341"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="892.5" x="416"><tspan dy="0" x="416">NPU: host-service</tspan></text></g><g/><g><line data-id="platform" data-et="life-line" name="platform" stroke="#999" stroke-width="0.5px" class="actor-line 200" y2="860" x2="1537" y1="65" x1="1537" id="actor433"/><g data-id="platform" data-et="participant" id="root-433"><rect class="actor actor-top" ry="3" rx="3" name="platform" height="65" width="161" stroke="#666" fill="#eaeaea" y="0" x="1456.5"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="32.5" x="1537"><tspan dy="0" x="1537">NPU: Platform code</tspan></text></g></g><g><line data-id="platform-api" data-et="life-line" name="platform-api" stroke="#999" stroke-width="0.5px" class="actor-line 200" y2="860" x2="1297" y1="65" x1="1297" id="actor432"/><g data-id="platform-api" data-et="participant" id="root-432"><rect class="actor actor-top" ry="3" rx="3" name="platform-api" height="65" width="150" stroke="#666" fill="#eaeaea" y="0" x="1222"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="32.5" x="1297"><tspan dy="0" x="1297">NPU: platform API</tspan></text></g></g><g><line data-id="chassisd" data-et="life-line" name="chassisd" stroke="#999" stroke-width="0.5px" class="actor-line 200" y2="860" x2="1097" y1="65" x1="1097" id="actor431"/><g data-id="chassisd" data-et="participant" 
id="root-431"><rect class="actor actor-top" ry="3" rx="3" name="chassisd" height="65" width="150" stroke="#666" fill="#eaeaea" y="0" x="1022"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="32.5" x="1097"><tspan dy="0" x="1097">NPU: chassisd</tspan></text></g></g><g><line data-id="chassis-state-db" data-et="life-line" name="chassis-state-db" stroke="#999" stroke-width="0.5px" class="actor-line 200" y2="860" x2="847" y1="65" x1="847" id="actor430"/><g data-id="chassis-state-db" data-et="participant" id="root-430"><rect class="actor actor-top" ry="3" rx="3" name="chassis-state-db" height="65" width="176" stroke="#666" fill="#eaeaea" y="0" x="759"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="32.5" x="847"><tspan dy="0" x="847">NPU: chassisStateDB</tspan></text></g></g><g><line data-id="state-db" data-et="life-line" name="state-db" stroke="#999" stroke-width="0.5px" class="actor-line 200" y2="860" x2="634" y1="65" x1="634" id="actor429"/><g data-id="state-db" data-et="participant" id="root-429"><rect class="actor actor-top" ry="3" rx="3" name="state-db" height="65" width="150" stroke="#666" fill="#eaeaea" y="0" x="559"/><text class="actor actor-box" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="32.5" x="634"><tspan dy="0" x="634">NPU: stateDB</tspan></text></g></g><g><line data-id="host-service" data-et="life-line" name="host-service" stroke="#999" stroke-width="0.5px" class="actor-line 200" y2="860" x2="416" y1="65" x1="416" id="actor428"/><g data-id="host-service" data-et="participant" id="root-428"><rect class="actor actor-top" ry="3" rx="3" name="host-service" height="65" width="150" stroke="#666" fill="#eaeaea" y="0" x="341"/><text class="actor actor-box" 
alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="32.5" x="416"><tspan dy="0" x="416">NPU: host-service</tspan></text></g></g><g><line data-id="Customer" data-et="life-line" name="Customer" stroke="#999" stroke-width="0.5px" class="actor-line 200" y2="860" x2="75" y1="80" x1="75" id="actor427"/></g><style>#export-svg{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:14px;fill:#333;}#export-svg .error-icon{fill:#ffffff;}#export-svg .error-text{fill:#000000;stroke:#000000;}#export-svg .edge-thickness-normal{stroke-width:1px;}#export-svg .edge-thickness-thick{stroke-width:3.5px;}#export-svg .edge-pattern-solid{stroke-dasharray:0;}#export-svg .edge-thickness-invisible{stroke-width:0;fill:none;}#export-svg .edge-pattern-dashed{stroke-dasharray:3;}#export-svg .edge-pattern-dotted{stroke-dasharray:2;}#export-svg .marker{fill:#000000;stroke:#000000;}#export-svg .marker.cross{stroke:#000000;}#export-svg svg{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:14px;}#export-svg p{margin:0;}#export-svg .actor{stroke:hsl(0, 0%, 70%);fill:#ffffff;}#export-svg text.actor&gt;tspan{fill:#333;stroke:none;}#export-svg .actor-line{stroke:hsl(0, 0%, 70%);}#export-svg .messageLine0{stroke-width:1.5;stroke-dasharray:none;stroke:#333;}#export-svg .messageLine1{stroke-width:1.5;stroke-dasharray:2,2;stroke:#333;}#export-svg #arrowhead path{fill:#333;stroke:#333;}#export-svg .sequenceNumber{fill:#ffffff;}#export-svg #sequencenumber{fill:#333;}#export-svg #crosshead path{fill:#333;stroke:#333;}#export-svg .messageText{fill:#333;stroke:none;}#export-svg .labelBox{stroke:hsl(0, 0%, 70%);fill:#ffffff;}#export-svg .labelText,#export-svg .labelText&gt;tspan{fill:#333;stroke:none;}#export-svg .loopText,#export-svg .loopText&gt;tspan{fill:#333;stroke:none;}#export-svg .loopLine{stroke-width:2px;stroke-dasharray:2,2;stroke:hsl(0, 0%, 70%);fill:hsl(0, 0%, 70%);}#export-svg .note{stroke:hsl(52.6829268293, 
60%, 73.9215686275%);fill:#fff5ad;}#export-svg .noteText,#export-svg .noteText&gt;tspan{fill:#333;stroke:none;}#export-svg .activation0{fill:hsl(-120, 0%, 80%);stroke:hsl(-120, 0%, 70%);}#export-svg .activation1{fill:hsl(-120, 0%, 80%);stroke:hsl(-120, 0%, 70%);}#export-svg .activation2{fill:hsl(-120, 0%, 80%);stroke:hsl(-120, 0%, 70%);}#export-svg .actorPopupMenu{position:absolute;}#export-svg .actorPopupMenuPanel{position:absolute;fill:#ffffff;box-shadow:0px 8px 16px 0px rgba(0,0,0,0.2);filter:drop-shadow(3px 5px 2px rgb(0 0 0 / 0.4));}#export-svg .actor-man line{stroke:hsl(0, 0%, 70%);fill:#ffffff;}#export-svg .actor-man circle,#export-svg line{stroke:hsl(0, 0%, 70%);fill:#ffffff;stroke-width:2px;}#export-svg .node .neo-node{stroke:#000000;}#export-svg [data-look="neo"].node rect,#export-svg [data-look="neo"].cluster rect,#export-svg [data-look="neo"].node polygon{stroke:url(#export-svg-gradient);filter:drop-shadow( 0px 1px 2px rgba(0, 0, 0, 0.25));}#export-svg [data-look="neo"].node rect,#export-svg [data-look="neo"].node polygon,#export-svg [data-look="neo"].node path{stroke:url(#export-svg-gradient);filter:drop-shadow( 0px 1px 2px rgba(0, 0, 0, 0.25));}#export-svg [data-look="neo"].node .neo-line path{stroke:hsl(0, 0%, 70%);filter:none;}#export-svg [data-look="neo"].node circle{stroke:url(#export-svg-gradient);filter:drop-shadow( 0px 1px 2px rgba(0, 0, 0, 0.25));}#export-svg [data-look="neo"].node circle .state-start{fill:#000000;}#export-svg [data-look="neo"].statediagram-cluster rect{fill:#ffffff;stroke:url(#export-svg-gradient);stroke-width:1px;}#export-svg [data-look="neo"].icon-shape .icon{fill:url(#export-svg-gradient);filter:drop-shadow( 0px 1px 2px rgba(0, 0, 0, 0.25));}#export-svg [data-look="neo"].icon-shape .icon-neo path{stroke:url(#export-svg-gradient);filter:drop-shadow( 0px 1px 2px rgba(0, 0, 0, 0.25));}#export-svg :root{--mermaid-font-family:"trebuchet ms",verdana,arial,sans-serif;}</style><g/><defs><symbol height="24" width="24" 
id="computer"><path d="M2 2v13h20v-13h-20zm18 11h-16v-9h16v9zm-10.228 6l.466-1h3.524l.467 1h-4.457zm14.228 3h-24l2-6h2.104l-1.33 4h18.45l-1.297-4h2.073l2 6zm-5-10h-14v-7h14v7z" transform="scale(.5)"/></symbol></defs><defs><symbol clip-rule="evenodd" fill-rule="evenodd" id="database"><path d="M12.258.001l.256.004.255.005.253.008.251.01.249.012.247.015.246.016.242.019.241.02.239.023.236.024.233.027.231.028.229.031.225.032.223.034.22.036.217.038.214.04.211.041.208.043.205.045.201.046.198.048.194.05.191.051.187.053.183.054.18.056.175.057.172.059.168.06.163.061.16.063.155.064.15.066.074.033.073.033.071.034.07.034.069.035.068.035.067.035.066.035.064.036.064.036.062.036.06.036.06.037.058.037.058.037.055.038.055.038.053.038.052.038.051.039.05.039.048.039.047.039.045.04.044.04.043.04.041.04.04.041.039.041.037.041.036.041.034.041.033.042.032.042.03.042.029.042.027.042.026.043.024.043.023.043.021.043.02.043.018.044.017.043.015.044.013.044.012.044.011.045.009.044.007.045.006.045.004.045.002.045.001.045v17l-.001.045-.002.045-.004.045-.006.045-.007.045-.009.044-.011.045-.012.044-.013.044-.015.044-.017.043-.018.044-.02.043-.021.043-.023.043-.024.043-.026.043-.027.042-.029.042-.03.042-.032.042-.033.042-.034.041-.036.041-.037.041-.039.041-.04.041-.041.04-.043.04-.044.04-.045.04-.047.039-.048.039-.05.039-.051.039-.052.038-.053.038-.055.038-.055.038-.058.037-.058.037-.06.037-.06.036-.062.036-.064.036-.064.036-.066.035-.067.035-.068.035-.069.035-.07.034-.071.034-.073.033-.074.033-.15.066-.155.064-.16.063-.163.061-.168.06-.172.059-.175.057-.18.056-.183.054-.187.053-.191.051-.194.05-.198.048-.201.046-.205.045-.208.043-.211.041-.214.04-.217.038-.22.036-.223.034-.225.032-.229.031-.231.028-.233.027-.236.024-.239.023-.241.02-.242.019-.246.016-.247.015-.249.012-.251.01-.253.008-.255.005-.256.004-.258.001-.258-.001-.256-.004-.255-.005-.253-.008-.251-.01-.249-.012-.247-.015-.245-.016-.243-.019-.241-.02-.238-.023-.236-.024-.234-.027-.231-.028-.228-.031-.226-.032-.223-.034-.22-.036-.217-.038-.214
-.04-.211-.041-.208-.043-.204-.045-.201-.046-.198-.048-.195-.05-.19-.051-.187-.053-.184-.054-.179-.056-.176-.057-.172-.059-.167-.06-.164-.061-.159-.063-.155-.064-.151-.066-.074-.033-.072-.033-.072-.034-.07-.034-.069-.035-.068-.035-.067-.035-.066-.035-.064-.036-.063-.036-.062-.036-.061-.036-.06-.037-.058-.037-.057-.037-.056-.038-.055-.038-.053-.038-.052-.038-.051-.039-.049-.039-.049-.039-.046-.039-.046-.04-.044-.04-.043-.04-.041-.04-.04-.041-.039-.041-.037-.041-.036-.041-.034-.041-.033-.042-.032-.042-.03-.042-.029-.042-.027-.042-.026-.043-.024-.043-.023-.043-.021-.043-.02-.043-.018-.044-.017-.043-.015-.044-.013-.044-.012-.044-.011-.045-.009-.044-.007-.045-.006-.045-.004-.045-.002-.045-.001-.045v-17l.001-.045.002-.045.004-.045.006-.045.007-.045.009-.044.011-.045.012-.044.013-.044.015-.044.017-.043.018-.044.02-.043.021-.043.023-.043.024-.043.026-.043.027-.042.029-.042.03-.042.032-.042.033-.042.034-.041.036-.041.037-.041.039-.041.04-.041.041-.04.043-.04.044-.04.046-.04.046-.039.049-.039.049-.039.051-.039.052-.038.053-.038.055-.038.056-.038.057-.037.058-.037.06-.037.061-.036.062-.036.063-.036.064-.036.066-.035.067-.035.068-.035.069-.035.07-.034.072-.034.072-.033.074-.033.151-.066.155-.064.159-.063.164-.061.167-.06.172-.059.176-.057.179-.056.184-.054.187-.053.19-.051.195-.05.198-.048.201-.046.204-.045.208-.043.211-.041.214-.04.217-.038.22-.036.223-.034.226-.032.228-.031.231-.028.234-.027.236-.024.238-.023.241-.02.243-.019.245-.016.247-.015.249-.012.251-.01.253-.008.255-.005.256-.004.258-.001.258.001zm-9.258 
20.499v.01l.001.021.003.021.004.022.005.021.006.022.007.022.009.023.01.022.011.023.012.023.013.023.015.023.016.024.017.023.018.024.019.024.021.024.022.025.023.024.024.025.052.049.056.05.061.051.066.051.07.051.075.051.079.052.084.052.088.052.092.052.097.052.102.051.105.052.11.052.114.051.119.051.123.051.127.05.131.05.135.05.139.048.144.049.147.047.152.047.155.047.16.045.163.045.167.043.171.043.176.041.178.041.183.039.187.039.19.037.194.035.197.035.202.033.204.031.209.03.212.029.216.027.219.025.222.024.226.021.23.02.233.018.236.016.24.015.243.012.246.01.249.008.253.005.256.004.259.001.26-.001.257-.004.254-.005.25-.008.247-.011.244-.012.241-.014.237-.016.233-.018.231-.021.226-.021.224-.024.22-.026.216-.027.212-.028.21-.031.205-.031.202-.034.198-.034.194-.036.191-.037.187-.039.183-.04.179-.04.175-.042.172-.043.168-.044.163-.045.16-.046.155-.046.152-.047.148-.048.143-.049.139-.049.136-.05.131-.05.126-.05.123-.051.118-.052.114-.051.11-.052.106-.052.101-.052.096-.052.092-.052.088-.053.083-.051.079-.052.074-.052.07-.051.065-.051.06-.051.056-.05.051-.05.023-.024.023-.025.021-.024.02-.024.019-.024.018-.024.017-.024.015-.023.014-.024.013-.023.012-.023.01-.023.01-.022.008-.022.006-.022.006-.022.004-.022.004-.021.001-.021.001-.021v-4.127l-.077.055-.08.053-.083.054-.085.053-.087.052-.09.052-.093.051-.095.05-.097.05-.1.049-.102.049-.105.048-.106.047-.109.047-.111.046-.114.045-.115.045-.118.044-.12.043-.122.042-.124.042-.126.041-.128.04-.13.04-.132.038-.134.038-.135.037-.138.037-.139.035-.142.035-.143.034-.144.033-.147.032-.148.031-.15.03-.151.03-.153.029-.154.027-.156.027-.158.026-.159.025-.161.024-.162.023-.163.022-.165.021-.166.02-.167.019-.169.018-.169.017-.171.016-.173.015-.173.014-.175.013-.175.012-.177.011-.178.01-.179.008-.179.008-.181.006-.182.005-.182.004-.184.003-.184.002h-.37l-.184-.002-.184-.003-.182-.004-.182-.005-.181-.006-.179-.008-.179-.008-.178-.01-.176-.011-.176-.012-.175-.013-.173-.014-.172-.015-.171-.016-.17-.017-.169-.018-.167-.019-.166-.02-.165-.021-.163-.022
-.162-.023-.161-.024-.159-.025-.157-.026-.156-.027-.155-.027-.153-.029-.151-.03-.15-.03-.148-.031-.146-.032-.145-.033-.143-.034-.141-.035-.14-.035-.137-.037-.136-.037-.134-.038-.132-.038-.13-.04-.128-.04-.126-.041-.124-.042-.122-.042-.12-.044-.117-.043-.116-.045-.113-.045-.112-.046-.109-.047-.106-.047-.105-.048-.102-.049-.1-.049-.097-.05-.095-.05-.093-.052-.09-.051-.087-.052-.085-.053-.083-.054-.08-.054-.077-.054v4.127zm0-5.654v.011l.001.021.003.021.004.021.005.022.006.022.007.022.009.022.01.022.011.023.012.023.013.023.015.024.016.023.017.024.018.024.019.024.021.024.022.024.023.025.024.024.052.05.056.05.061.05.066.051.07.051.075.052.079.051.084.052.088.052.092.052.097.052.102.052.105.052.11.051.114.051.119.052.123.05.127.051.131.05.135.049.139.049.144.048.147.048.152.047.155.046.16.045.163.045.167.044.171.042.176.042.178.04.183.04.187.038.19.037.194.036.197.034.202.033.204.032.209.03.212.028.216.027.219.025.222.024.226.022.23.02.233.018.236.016.24.014.243.012.246.01.249.008.253.006.256.003.259.001.26-.001.257-.003.254-.006.25-.008.247-.01.244-.012.241-.015.237-.016.233-.018.231-.02.226-.022.224-.024.22-.025.216-.027.212-.029.21-.03.205-.032.202-.033.198-.035.194-.036.191-.037.187-.039.183-.039.179-.041.175-.042.172-.043.168-.044.163-.045.16-.045.155-.047.152-.047.148-.048.143-.048.139-.05.136-.049.131-.05.126-.051.123-.051.118-.051.114-.052.11-.052.106-.052.101-.052.096-.052.092-.052.088-.052.083-.052.079-.052.074-.051.07-.052.065-.051.06-.05.056-.051.051-.049.023-.025.023-.024.021-.025.02-.024.019-.024.018-.024.017-.024.015-.023.014-.023.013-.024.012-.022.01-.023.01-.023.008-.022.006-.022.006-.022.004-.021.004-.022.001-.021.001-.021v-4.139l-.077.054-.08.054-.083.054-.085.052-.087.053-.09.051-.093.051-.095.051-.097.05-.1.049-.102.049-.105.048-.106.047-.109.047-.111.046-.114.045-.115.044-.118.044-.12.044-.122.042-.124.042-.126.041-.128.04-.13.039-.132.039-.134.038-.135.037-.138.036-.139.036-.142.035-.143.033-.144.033-.147.033-.148.031-.15.03-.151.03-.153.028-.154.028
-.156.027-.158.026-.159.025-.161.024-.162.023-.163.022-.165.021-.166.02-.167.019-.169.018-.169.017-.171.016-.173.015-.173.014-.175.013-.175.012-.177.011-.178.009-.179.009-.179.007-.181.007-.182.005-.182.004-.184.003-.184.002h-.37l-.184-.002-.184-.003-.182-.004-.182-.005-.181-.007-.179-.007-.179-.009-.178-.009-.176-.011-.176-.012-.175-.013-.173-.014-.172-.015-.171-.016-.17-.017-.169-.018-.167-.019-.166-.02-.165-.021-.163-.022-.162-.023-.161-.024-.159-.025-.157-.026-.156-.027-.155-.028-.153-.028-.151-.03-.15-.03-.148-.031-.146-.033-.145-.033-.143-.033-.141-.035-.14-.036-.137-.036-.136-.037-.134-.038-.132-.039-.13-.039-.128-.04-.126-.041-.124-.042-.122-.043-.12-.043-.117-.044-.116-.044-.113-.046-.112-.046-.109-.046-.106-.047-.105-.048-.102-.049-.1-.049-.097-.05-.095-.051-.093-.051-.09-.051-.087-.053-.085-.052-.083-.054-.08-.054-.077-.054v4.139zm0-5.666v.011l.001.02.003.022.004.021.005.022.006.021.007.022.009.023.01.022.011.023.012.023.013.023.015.023.016.024.017.024.018.023.019.024.021.025.022.024.023.024.024.025.052.05.056.05.061.05.066.051.07.051.075.052.079.051.084.052.088.052.092.052.097.052.102.052.105.051.11.052.114.051.119.051.123.051.127.05.131.05.135.05.139.049.144.048.147.048.152.047.155.046.16.045.163.045.167.043.171.043.176.042.178.04.183.04.187.038.19.037.194.036.197.034.202.033.204.032.209.03.212.028.216.027.219.025.222.024.226.021.23.02.233.018.236.017.24.014.243.012.246.01.249.008.253.006.256.003.259.001.26-.001.257-.003.254-.006.25-.008.247-.01.244-.013.241-.014.237-.016.233-.018.231-.02.226-.022.224-.024.22-.025.216-.027.212-.029.21-.03.205-.032.202-.033.198-.035.194-.036.191-.037.187-.039.183-.039.179-.041.175-.042.172-.043.168-.044.163-.045.16-.045.155-.047.152-.047.148-.048.143-.049.139-.049.136-.049.131-.051.126-.05.123-.051.118-.052.114-.051.11-.052.106-.052.101-.052.096-.052.092-.052.088-.052.083-.052.079-.052.074-.052.07-.051.065-.051.06-.051.056-.05.051-.049.023-.025.023-.025.021-.024.02-.024.019-.024.018-.024.017-.024.015-.023.014-.024.013-.0
23.012-.023.01-.022.01-.023.008-.022.006-.022.006-.022.004-.022.004-.021.001-.021.001-.021v-4.153l-.077.054-.08.054-.083.053-.085.053-.087.053-.09.051-.093.051-.095.051-.097.05-.1.049-.102.048-.105.048-.106.048-.109.046-.111.046-.114.046-.115.044-.118.044-.12.043-.122.043-.124.042-.126.041-.128.04-.13.039-.132.039-.134.038-.135.037-.138.036-.139.036-.142.034-.143.034-.144.033-.147.032-.148.032-.15.03-.151.03-.153.028-.154.028-.156.027-.158.026-.159.024-.161.024-.162.023-.163.023-.165.021-.166.02-.167.019-.169.018-.169.017-.171.016-.173.015-.173.014-.175.013-.175.012-.177.01-.178.01-.179.009-.179.007-.181.006-.182.006-.182.004-.184.003-.184.001-.185.001-.185-.001-.184-.001-.184-.003-.182-.004-.182-.006-.181-.006-.179-.007-.179-.009-.178-.01-.176-.01-.176-.012-.175-.013-.173-.014-.172-.015-.171-.016-.17-.017-.169-.018-.167-.019-.166-.02-.165-.021-.163-.023-.162-.023-.161-.024-.159-.024-.157-.026-.156-.027-.155-.028-.153-.028-.151-.03-.15-.03-.148-.032-.146-.032-.145-.033-.143-.034-.141-.034-.14-.036-.137-.036-.136-.037-.134-.038-.132-.039-.13-.039-.128-.041-.126-.041-.124-.041-.122-.043-.12-.043-.117-.044-.116-.044-.113-.046-.112-.046-.109-.046-.106-.048-.105-.048-.102-.048-.1-.05-.097-.049-.095-.051-.093-.051-.09-.052-.087-.052-.085-.053-.083-.053-.08-.054-.077-.054v4.153zm8.74-8.179l-.257.004-.254.005-.25.008-.247.011-.244.012-.241.014-.237.016-.233.018-.231.021-.226.022-.224.023-.22.026-.216.027-.212.028-.21.031-.205.032-.202.033-.198.034-.194.036-.191.038-.187.038-.183.04-.179.041-.175.042-.172.043-.168.043-.163.045-.16.046-.155.046-.152.048-.148.048-.143.048-.139.049-.136.05-.131.05-.126.051-.123.051-.118.051-.114.052-.11.052-.106.052-.101.052-.096.052-.092.052-.088.052-.083.052-.079.052-.074.051-.07.052-.065.051-.06.05-.056.05-.051.05-.023.025-.023.024-.021.024-.02.025-.019.024-.018.024-.017.023-.015.024-.014.023-.013.023-.012.023-.01.023-.01.022-.008.022-.006.023-.006.021-.004.022-.004.021-.001.021-.001.021.001.021.001.021.004.021.004.022.006.021.006.023.008.02
2.01.022.01.023.012.023.013.023.014.023.015.024.017.023.018.024.019.024.02.025.021.024.023.024.023.025.051.05.056.05.06.05.065.051.07.052.074.051.079.052.083.052.088.052.092.052.096.052.101.052.106.052.11.052.114.052.118.051.123.051.126.051.131.05.136.05.139.049.143.048.148.048.152.048.155.046.16.046.163.045.168.043.172.043.175.042.179.041.183.04.187.038.191.038.194.036.198.034.202.033.205.032.21.031.212.028.216.027.22.026.224.023.226.022.231.021.233.018.237.016.241.014.244.012.247.011.25.008.254.005.257.004.26.001.26-.001.257-.004.254-.005.25-.008.247-.011.244-.012.241-.014.237-.016.233-.018.231-.021.226-.022.224-.023.22-.026.216-.027.212-.028.21-.031.205-.032.202-.033.198-.034.194-.036.191-.038.187-.038.183-.04.179-.041.175-.042.172-.043.168-.043.163-.045.16-.046.155-.046.152-.048.148-.048.143-.048.139-.049.136-.05.131-.05.126-.051.123-.051.118-.051.114-.052.11-.052.106-.052.101-.052.096-.052.092-.052.088-.052.083-.052.079-.052.074-.051.07-.052.065-.051.06-.05.056-.05.051-.05.023-.025.023-.024.021-.024.02-.025.019-.024.018-.024.017-.023.015-.024.014-.023.013-.023.012-.023.01-.023.01-.022.008-.022.006-.023.006-.021.004-.022.004-.021.001-.021.001-.021-.001-.021-.001-.021-.004-.021-.004-.022-.006-.021-.006-.023-.008-.022-.01-.022-.01-.023-.012-.023-.013-.023-.014-.023-.015-.024-.017-.023-.018-.024-.019-.024-.02-.025-.021-.024-.023-.024-.023-.025-.051-.05-.056-.05-.06-.05-.065-.051-.07-.052-.074-.051-.079-.052-.083-.052-.088-.052-.092-.052-.096-.052-.101-.052-.106-.052-.11-.052-.114-.052-.118-.051-.123-.051-.126-.051-.131-.05-.136-.05-.139-.049-.143-.048-.148-.048-.152-.048-.155-.046-.16-.046-.163-.045-.168-.043-.172-.043-.175-.042-.179-.041-.183-.04-.187-.038-.191-.038-.194-.036-.198-.034-.202-.033-.205-.032-.21-.031-.212-.028-.216-.027-.22-.026-.224-.023-.226-.022-.231-.021-.233-.018-.237-.016-.241-.014-.244-.012-.247-.011-.25-.008-.254-.005-.257-.004-.26-.001-.26.001z" transform="scale(.5)"/></symbol></defs><defs><symbol height="24" width="24" id="clock"><path 
d="M12 2c5.514 0 10 4.486 10 10s-4.486 10-10 10-10-4.486-10-10 4.486-10 10-10zm0-2c-6.627 0-12 5.373-12 12s5.373 12 12 12 12-5.373 12-12-5.373-12-12-12zm5.848 12.459c.202.038.202.333.001.372-1.907.361-6.045 1.111-6.547 1.111-.719 0-1.301-.582-1.301-1.301 0-.512.77-5.447 1.125-7.445.034-.192.312-.181.343.014l.985 6.238 5.394 1.011z" transform="scale(.5)"/></symbol></defs><defs><marker orient="auto-start-reverse" markerHeight="12" markerWidth="12" markerUnits="userSpaceOnUse" refY="5" refX="7.9" id="arrowhead"><path d="M -1 0 L 10 5 L 0 10 z"/></marker></defs><defs><marker refY="4.5" refX="4" orient="auto" markerHeight="8" markerWidth="15" id="crosshead"><path style="stroke-dasharray: 0, 0;" d="M 1,2 L 6,7 M 6,2 L 1,7" stroke-width="1pt" stroke="#000000" fill="none"/></marker></defs><defs><marker orient="auto" markerHeight="28" markerWidth="20" refY="7" refX="15.5" id="filled-head"><path d="M 18,7 L9,13 L14,7 L9,1 Z"/></marker></defs><defs><marker orient="auto" markerHeight="40" markerWidth="60" refY="15" refX="15" id="sequencenumber"><circle r="6" cy="15" cx="15"/></marker></defs><g/><g/><g><rect class="activation2" height="166" width="10" stroke="#666" fill="#EDF2AE" y="265" x="421"/></g><g><rect class="activation0" height="274" width="10" stroke="#666" fill="#EDF2AE" y="556" x="1092"/></g><g><rect class="activation0" height="136" width="10" stroke="#666" fill="#EDF2AE" y="602" x="1292"/></g><g><rect class="activation0" height="44" width="10" stroke="#666" fill="#EDF2AE" y="648" x="1532"/></g><g/><g data-id="ibe6965608a" data-et="control-structure"><line class="loopLine" y2="441" x2="1552" y1="441" x1="401"/><line class="loopLine" y2="840" x2="1552" y1="441" x1="1552"/><line class="loopLine" y2="840" x2="1552" y1="840" x1="401"/><line class="loopLine" y2="840" x2="401" y1="441" x1="401"/><polygon class="labelBox" points="401,441 451,441 451,454 442.6,461 401,461"/><text class="labelText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" 
dominant-baseline="middle" text-anchor="middle" y="454" x="426">loop</text><text class="loopText" style="font-size: 16px; font-weight: 400;" text-anchor="middle" y="459" x="1001.5"><tspan x="1001.5">[module_db_update]</tspan></text></g><g data-id="Customer" data-et="participant" name="Customer" class="actor-man actor-top"><line y2="45" x2="75" y1="25" x1="75" id="actor-man-torso427"/><line y2="33" x2="93" y1="33" x1="57" id="actor-man-arms427"/><line y2="45" x2="75" y1="60" x1="57"/><line y2="60" x2="91" y1="45" x1="75"/><circle height="65" width="150" r="15" cy="10" cx="75"/><text class="actor actor-man" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="67.5" x="75"><tspan dy="0" x="75">User</tspan></text></g><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="80" x="242">Input: PowerOn or Reboot config or cli</text><line style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="host-service" data-from="Customer" data-id="i9b5ea11f99" data-et="message" class="messageLine0" y2="111" x2="408" y1="111" x1="76"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="126" x="421">determine-reboot-cause</text><path style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="host-service" data-from="host-service" data-id="i7a7586c55d" data-et="message" class="messageLine0" d="M 421,157 C 481,147 481,187 421,177"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="202" x="426">update-reboot-cause</text><path style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="host-service" data-from="host-service" 
data-id="i4065c2f35a" data-et="message" class="messageLine0" d="M 426,233 C 486,223 486,263 426,253"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="278" x="531">update-reboot-cause</text><line style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="state-db" data-from="host-service" data-id="i1c75c69069" data-et="message" class="messageLine0" y2="309" x2="630" y1="309" x1="431"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="324" x="637">update-reboot-cause</text><line style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="chassis-state-db" data-from="host-service" data-id="if74cbc5203" data-et="message" class="messageLine0" y2="355" x2="843" y1="355" x1="431"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="370" x="431">end processing</text><path style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="host-service" data-from="host-service" data-id="i3ea8b26ead" data-et="message" class="messageLine0" d="M 431,401 C 491,391 491,431 431,421"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="491" x="1098">oper-status out of offline</text><path style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="chassisd" data-from="chassisd" data-id="i7d2b8f0014" data-et="message" class="messageLine0" d="M 1098,524 C 1158,514 1158,554 1098,544"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="569" 
x="1196">get-reboot-cause</text><line style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="platform-api" data-from="chassisd" data-id="i5dee756ade" data-et="message" class="messageLine0" y2="600" x2="1289" y1="600" x1="1102"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="615" x="1416">xtract-dpu-reboot-cause</text><line style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="platform" data-from="platform-api" data-id="iaf5e148fb8" data-et="message" class="messageLine0" y2="646" x2="1529" y1="646" x1="1302"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="661" x="1419">dpu-reboot-cause</text><line marker-end="url(#arrowhead)" style="stroke-dasharray: 3, 3; fill: none;" stroke="none" stroke-width="2" data-to="platform-api" data-from="platform" data-id="i8579b17111" data-et="message" class="messageLine1" y2="692" x2="1305" y1="692" x1="1532"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="707" x="1199">reboot-cause</text><line marker-end="url(#arrowhead)" style="stroke-dasharray: 3, 3; fill: none;" stroke="none" stroke-width="2" data-to="chassisd" data-from="platform-api" data-id="ib9c8c81dc6" data-et="message" class="messageLine1" y2="738" x2="1105" y1="738" x1="1292"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="753" x="761">persist-dpu-reboot-cause</text><line style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="host-service" data-from="chassisd" data-id="idc8e8af461" data-et="message" class="messageLine0" y2="784" x2="429" 
y1="784" x1="1092"/><text dy="1em" class="messageText" style="font-size: 16px; font-weight: 400;" alignment-baseline="middle" dominant-baseline="middle" text-anchor="middle" y="799" x="972">update-dpu-reboot-cause</text><line style="fill: none;" marker-end="url(#arrowhead)" stroke="none" stroke-width="2" data-to="chassis-state-db" data-from="chassisd" data-id="ieb9e30d242" data-et="message" class="messageLine0" y2="830" x2="851" y1="830" x1="1092"/><g name="Customer" class="actor-man actor-bottom"><line y2="905" x2="75" y1="885" x1="75" id="actor-man-torso433"/><line y2="893" x2="93" y1="893" x1="57" id="actor-man-arms433"/><line y2="905" x2="75" y1="920" x1="57"/><line y2="920" x2="91" y1="905" x1="75"/><circle height="65" width="150" r="15" cy="870" cx="75"/><text class="actor actor-man" alignment-baseline="central" dominant-baseline="central" style="text-anchor: middle; font-size: 16px; font-weight: 400;" y="927.5" x="75"><tspan dy="0" x="75">User</tspan></text></g></svg>
\ No newline at end of file
diff --git a/doc/smart-switch/pmon/smartswitch-pmon.md b/doc/smart-switch/pmon/smartswitch-pmon.md
index 2c95cbb385..9c58b1bfd0 100644
--- a/doc/smart-switch/pmon/smartswitch-pmon.md
+++ b/doc/smart-switch/pmon/smartswitch-pmon.md
@@ -5,6 +5,7 @@
 | 0.1 | 12/02/2023 | Ramesh Raghupathy | Initial version|
 | 0.2 | 01/08/2024 | Ramesh Raghupathy | Updated API, CPI sections and addressed review comments |
 | 0.3 | 02/26/2024 | Ramesh Raghupathy | Addressed review comments |
+| 0.4 | 06/06/2024 | Ramesh Raghupathy | Added schema for DPU health-info and called out phase:1 and phase:2 activities for DPU health-info. Added key suffix to module reboot-cause to avoid key conflicts |
 
 ## Definitions / Abbreviations
 
@@ -60,7 +61,7 @@ The picture below highlights the PMON vertical and its association with other lo
 * The SmartSwitch host PMON should be able to Startup, Shutdown, Restart, and Soft Reboot the entire system or the individual DPUs. The DPU_MODULE will behave like the LINE_CARD_MODULE of a modular chassis with respect to these functions.
 
 ### SmartSwitch Power up/down sequence:
-* When the smartswitch device is booted, the host will boot first and leave the DPUs either up or down depending on the configuration. The DPUs will be up by default.
+* When the smartswitch device is booted, the host will boot first and leave the DPUs down by default.
 * This section describes the cold startup, shutdown, restart and soft reboot. 
 
 ### Cold Startup
@@ -77,7 +78,7 @@ The picture below highlights the PMON vertical and its association with other lo
 #### DPU cold startup Sequence
 * The chassis is powered up and the host is booting up.
 * The switch PMON is registered with the configDB state change handler.
-* DPU "admin_status: up" is set in the configDB. When not explicitly configured the default is "up".
+* If the DPU's "admin_status" is "down" in the configDB, the DPU will remain powered down. The default setting is "down".
 * The switch PMON gets the admin up notification from the configDB
 * The switch PMON invokes the platform API to power on the DPU
 * DPU boots up and attaches itself to the midplane.
@@ -86,12 +87,23 @@ The picture below highlights the PMON vertical and its association with other lo
 ### DPU startup sequence diagram
 <p align="center"><img src="./images/dpu-startup-seq.svg"></p>
 
-### Configuring startup and shutdown
-* The DPUs can be powered down by configuring the admin_status as shown.
-* The corresponding switch configDB table is also shown
+#### 2.1.1 DPUs in dark mode
+* A smartswitch that is configured to boot up with all of its DPUs powered down is referred to as having its DPUs in dark mode.
+* In the dark mode the platform.json file shown in section "3.1.3" will not have the dictionary for the DPUS.
+* The term dark mode is overloaded in some cases where the platform.json may have the dictionary but the config_db.json will have the admin_state of all DPU modules as "down".
+* When platform.json has DPU information, but config DB doesn't have the DPU admin state configuration, the DPUs should be in the down state.
+* Default mode on smartswitch is dark mode, unless platform.json configures it to be in light up mode.
+* The DPUs stay powered down in dark mode and will not consume power.
+
+#### 2.1.2 Configuring startup and shutdown
+* The user can use the “config chassis modules startup DPUx”  to power ON a DPU. Example: “config chassis modules startup DPU0”
+* The “config chassis modules shutdown DPUx” is used to power OFF a DPU. Example: “config chassis modules shutdown DPU0”
+* The DPUs are powered down by configuring the admin_status as shown in the schema
+* The config change event handler running on the chassisd of PMON listens to the config change and sets the corresponding switch configDB table and also triggers the module set_admin_state() API.
+* The platform executes the power ON/OFF sequence
 
 #### config_db.json
-CHASSIS_MODULE table holds the list and configuration of DPU modules in a smartswitch chassis. It allows user to administratively bring down a DPU
+CHASSIS_MODULE table holds the list and configuration of DPU modules in a smartswitch chassis. It allows the user to administratively bring down a DPU. The following example assumes four DPUs in the system. Unlike the existing modular chassis configuration, in a SmartSwitch a DPU module has to be explicitly configured to be "up"; otherwise it will be configured in the DB to be "down" as shown in the example.
 ```
 {
     "CHASSIS_MODULE": {
@@ -99,9 +111,10 @@ CHASSIS_MODULE table holds the list and configuration of DPU modules in a smarts
             "admin_status": "down"
         },
         "DPU1": {
-            "admin_status": "down"
+            "admin_status": "up"
         }
     }
+    Note: There is no config for DPU2, DPU3 and the default is "down" as shown below
 }
 ```
 #### switch configDB
@@ -111,6 +124,21 @@ Key: "CHASSIS_MODULE|DPU0"
         "value": {
             "admin_status":"down"
         }
+    },
+    "CHASSIS_MODULE|DPU1": {
+        "value": {
+            "admin_status":"up"
+        }
+    },
+    "CHASSIS_MODULE|DPU2": {
+        "value": {
+            "admin_status":"down"
+        }
+    },
+    "CHASSIS_MODULE|DPU3": {
+        "value": {
+            "admin_status":"down"
+        }
     }
 ```
 
@@ -127,10 +155,11 @@ Key: "CHASSIS_MODULE|DPU0"
 * DPU: Maintenance, Critical alarm, Service migration, RMA
 #### DPU shutdown sequence
 * There could be two possible sources for DPU shutdown. 1. A configuration change to DPU "admin_status: down" 2. The GNOI logic can trigger it.
-* The GNOI server runs on the DPU even after the DPU is shutdown.
-* The host sends a GNOI signal to shutdown the DPU. The DPU does a pre-shutdown and sends an ack back to the host.
-* Upon receiving the ack or on a timeout the host may trigger the switch PMON to shutdown the DPU.
-* NPU-DPU (GNOI) soft reboot workflow will be captured in another document.
+* The GNOI server runs on the DPU even after the DPU is pre-shutdown and listens until the graceful shutdown finishes.
+* The host sends a GNOI signal to shutdown the DPU. The DPU does a graceful-shutdown if not already done and sends an ack back to the host.
+* Upon receiving the ack or on a timeout the host may trigger the switch PMON vendor API to shutdown the DPU.
+* If a vendor specific API is not defined, detachment is done via sysfs (echo 1 > /sys/bus/pci/devices/XXXX:XX:XX.X/remove).
+* NPU-DPU (GNOI) soft reboot workflow is captured in [reboot-hld.md](https://github.com/sonic-net/SONiC/blob/26f3f4e282f3d2bd4a5c684608897850354f5c30/doc/smart-switch/reboot/reboot-hld.md)
 * In the first option the "admin_status: down" configDB status change event will send a message to the switch PMON.
 * The switch PMON will invoke the module class API "set_admin_state(self, up):" with the state being "down" and the platform in turn will call its API to gracefully shutdown the DPU.  
 * The DPU upon receiving the shutdown message will do a graceful shutdown and send an ack back. The DPU graceful shutdown is vendor specific. The DPU power will be turned off after the graceful shutdown. In case of timeout the platform will force power down.
@@ -158,14 +187,14 @@ Key: "CHASSIS_MODULE|DPU0"
 * DPU: Gracefully restart SONiC on DPU
 #### Trigger
 * Switch: “reboot” command issued on switch console.
-* DPU: “reboot” command issued on DPU console or Switch Software issues GNOI
+* DPU: “reboot” command issued to the DPU or Switch Software issues GNOI
 #### Use case
 * Switch: Fault recovery, Maintenance, debug
-* DPU: Fault recover, Maintenance, debug, Service provisioning
+* DPU: Fault recovery, Maintenance, debug, Service provisioning
 
 #### Onboarding requirements
 * The DPU must provide additional control-plane and data-plane state information, timestamp, etc to DPU_STATE table as explained in the DPU_STATE schema once booted up.
-* When the DPU reboots itself, should log the reboot cause and update the previous-reboot-cause field in the stateDB
+* When the DPU reboots itself, it should log the reboot cause, update the previous-reboot-cause field in the stateDB and persist it on the Switch.
 * The reboot-cause history on the switch should provide a holistic view of the reboot cause of the SmartSwitch host CPU, and the reboot-cause of all the DPUs
 * The DPUs should be uniquely identified and the DPU upon boot may get this ID from the host and identify itself.
 * Implement the required API enhancements and new APIs for DPU management (see details in design section)
@@ -179,6 +208,7 @@ Key: "CHASSIS_MODULE|DPU0"
     * The DPUs should provide their state to the host by updating the dpu state data in the DPU_STATE table in the host ChassisStateDB (explained in DB schema). This holds the minimal, viable set of low latency dpu state data and can be consumed by HA, LB, FaultManagement logics.
     * DPUs should be able to store the data using a redis call directly on to the switch chassisStateDB
     * The DPU must provide the state information once it boots its OS to DPU_STATE table.
+    * The chassisd on the NPU-PMON will update the dpu_midplane_link_state, dpu_midplane_link_time, dpu_midplane_link_reason fields whenever there is a dpu_midplane_link_state transition.
 
 * Thermal management
     * Besides additional DPU specific sensors, cooling device changes the logic remains the same.
@@ -189,13 +219,15 @@ Key: "CHASSIS_MODULE|DPU0"
 * Show CLIs
     * Extend existing CLIs such as 'show platform fan/temperature' to support the new HW
     * Extend the modular chassis CLI 'show chassis modules status" to display the detailed DPU states. (See CLIs section)
-    * The data for the CLIs come either from the DBs or through the platform APIs. Example: The reboot-cause history and the DPU_STATE are stored in the ChassisStateDB directly using a redis call and the CLIs access them from the DB. It is upt to the platform implementation on how do they fetch the DPU inventory and health data and store them on the host. For the sake of consistency and efficiency we recommend using the redis call and storing them in the chassisStateDB on the host.
+    * The data for the CLIs come either from the DBs or through the platform APIs. Example: The DPU_STATE data are stored in the ChassisStateDB directly using a redis call and the CLIs access them from the DB. It is up to the platform implementation how the DPU inventory and health data are fetched and stored on the host. For the sake of consistency and efficiency we recommend using the redis call and storing them in the chassisStateDB on the host.
 
 ### 2.3. Detect and Debug
 * Health
     * SmartSwitch DPUs should store their health data locally and also provide it to the host for a consolidated view of the CLIs
     * DPUs should support a CLI to display the health data “show system-health ...” (See CLIs section)
-    * The host pmon should use this data to support the host side CLIs. Though accessing this data from DPUs and storing them on the switch is implementation specific it is recommended to use redis call and store them on the switch chassisStateDB for faster access. use "UserDefinedChecker" class to provide this data to the CLIs.
+    * The host pmon should use this data to support the host side CLIs. Though accessing this data from DPUs and storing them on the switch is implementation specific it is recommended to use redis call and store them on the switch chassisStateDB for faster access.
+    * This is done in two phases. Please refer to section:3.1.5.1 for the HEALTH_INFO schema
+    * use "UserDefinedChecker" class to provide this data to the CLIs.
     * Vendor specific data such as interrupt events can also be placed in user defined fields under this DB
     * This table already exists in modular chassis design and the DPUs will use this just like a line card.
 * Alarm and Syslog
@@ -219,7 +251,6 @@ SmartSwitch PMON block diagram
 
 ### 3.1. Platform monitoring and management
 * SmartSwitch design Extends the existing chassis_base class and module_base class as described below.
-* Extend MODULE_TYPE in ModuleBase class with MODULE_TYPE_DPU and MODULE_TYPE_SWITCH to support SmartSwitch
 
 #### 3.1.1 ChassisBase class API enhancements
 is_modular_chassis(self):
@@ -280,7 +311,7 @@ get_dpu_id(self, name):
     Retrieves the DPU ID for the given dpu-module name. Returns None for non-smartswitch chassis.
 
     Returns:
-        An integer, indicating the DPU ID Ex: name:DPU0 return value 1, name:DPU1 return value 2, name:DPUX return value X+1
+        An integer, indicating the DPU ID Ex: name:DPU0 return value 0, name:DPU1 return value 1, name:DPUX return value X
 ```
 
 is_smartswitch(self):
@@ -291,42 +322,22 @@ is_smartswitch(self):
       True
 ```
 
-get_module_dpu_data_port(self, index):
-```
-    Retrieves the DPU data port NPU-DPU association represented for the DPU index. Platforms that need to overwrite the platform.json file will use this API
-
-    This is valid only on the Switch and not on DPUs. On the DPUs this can return None
-
-    Args:
-        index: An integer, the index of the module to retrieve
-
-    Returns:
-        NPU-DPU port association: A string Ex: For index: 1 will return the dup0 port association which is "Ethernet224: Ethernet0" where the string left of ":" (Ethernet224) is the NPU port and the string right of ":" (Ethernet0) is the DPU port.
-```
 #### 3.1.3 NPU to DPU data port mapping
-platform.json of NPU/switch will show the NPU to DPU data port mapping. This will be used by services early in the system boot. 
+platform.json of NPU/switch will show the NPU to DPU data port mapping. This will be used by services early in the system boot.
 ```
-{
-    "DPUs" : [
+    "DPUS": [
         {
-        "dpu0": {
-                    "interface": {"Ethernet224": "Ethernet0"}
-        }
-        },
-        {
-        "dpu1": {
-                    "interface": {"Ethernet232": "Ethernet0"}
+            "dpu0": {
+                "interface": {"Ethernet224": "Ethernet0"}
+            },
+            "dpu1": {
+                "interface": {"Ethernet232": "Ethernet0"}
+            },
+            "dpux": {
+                "interface": {"Ethernet2xx": "Ethernet0"}
             },
-        },
-        .
-        .
-        {
-        "dpuX": {
-                    "interface": {"EthernetX": "EthernetY"}
-            }
         }
     ]
-}
 ```
 #### 3.1.4 ModuleBase class API enhancements
 get_base_mac(self):
@@ -367,7 +378,7 @@ get_type(self):
 
     Returns:
         A string, the module-type from one of the predefined types:
-        MODULE_TYPE_SWITCH, MODULE_TYPE_DPU
+        MODULE_TYPE_DPU
 ```
 
 get_oper_status(self):
@@ -403,7 +414,7 @@ reboot(self, reboot_type):
 set_admin_state(self, up):
 ```
     Request to keep the card/DPU in administratively up/down state.
-    Default state is up.
+    Default state is down.
 ```
 
 get_maximum_consumed_power(self):
@@ -436,34 +447,94 @@ is_midplane_reachable(self):
 #### 3.1.5 ModuleBase class new APIs
 
 ##### 3.1.5.1 Need for consistent storage and access of DPU reboot cause, state and health
-1.  The smartswitch needs to know the reboot cause for DPUs. Please refer to the CLI section for the various options and their effects when executed on the switch and DPUs. 
+#### 1 Reboot Cause
+The smartswitch needs to know the reboot cause for the NPU and the DPUs.
 
-* Each DPU will update its reboot cause history in the Switch ChasissStateDB upon boot up. The recent reboot-cause can be derived from that list of reboot-causes.
-* The get_reboot_cause will return the current reboot-cause of the module.
-* For persistent storage of the DPU reboot-cause and reboot-caue-history files use the existing host storage path and mechanism.
+#### NPU Reboot Cause
+* When the NPU undergoes a reboot the existing reboot-cause workflow for a switch still remains the same for a smartswitch as well.
+* When the NPU reboots the "determine_reboot_cause" fetches the npu reboot-cause and persists the files in "/host/reboot-cause" path.
+* A maximum of ten reboot-cause history entries per dpu will be persisted just like the npu.
+* The "update_reboot_cause" function updates the stateDB with reboot-cause, time, user etc as shown in the schema.
+* The existing "show reboot-cause" and "show reboot-cause history" CLIs will be backward compatible. Please refer to the CLI section.
 
-#### Schema for REBOOT_CAUSE - switch stateDB
+#### Schema for REBOOT_CAUSE of SWITCH on switch stateDB
 ```
   Key: "REBOOT_CAUSE|2023_06_18_14_56_12"
 
   "REBOOT_CAUSE|2023_06_18_14_56_12": {
     "value": {
-      "cause": "REBOOT_CAUSE_HOST_RESET_DPU",
+      "cause": "Unknown",
       "comment": "N/A",
-      "device": "DPU5",
       "time": "2023_06_18_14_56_12",
       "user": "N/A"
     }
-  },
+  }
+
+```
+#### DPU Reboot Cause
+* The smartswitch needs to know the reboot cause for all the DPUs.
+* The NPU hardware should be capable of providing the DPU reboot-cause even when the DPUs are dead.
+* The get_reboot_cause will return the current reboot-cause of the module.
+* For persistent storage of the DPU reboot-cause and reboot-cause-history files use the existing mechanism and host storage path under "/host/reboot-cause/module/dpux".
+* The storage and retrieval of the reboot-cause of the Switch and DPUs are shown in the sequence diagram below.
+
+<p align="center"><img src="./images/dpu-reboot-seq.svg"></p>
+
+#### Reboot workflow
+* The switch boots up. Determines the NPU reboot cause. 
+* Processes the previously stored NPU and DPU reboot-cause files and history files.
+* A maximum of ten reboot-cause history entries per dpu will be persisted just like the npu.
+* Updates the NPU reboot-cause into the StateDB and the DPU reboot-cause into the ChassisStateDB.
+* The above process is a one-shot event on boot up.
+* The module_db_update function in the NPU-PMON chassisd is an existing function constantly updating the operational status of the DPUs.
+* This function looks for DPU operational status change events and when the DPUs come out of "offline" state, issues "get_reboot_cause" API to the platform.
+* The dpu operational state transition from 'offline' to 'online' guarantees the reboot of a DPU.
+* The platform code will extract the DPU reboot cause from the NPU hardware itself even when the DPU is not reachable.
+* The DPU reboot cause will be mapped to one of the following existing reboot causes and returned back.
+    * REBOOT_CAUSE_POWER_LOSS = "Power Loss"
+    * REBOOT_CAUSE_THERMAL_OVERLOAD_CPU = "Thermal Overload: CPU"
+    * REBOOT_CAUSE_THERMAL_OVERLOAD_ASIC = "Thermal Overload: ASIC"
+    * REBOOT_CAUSE_THERMAL_OVERLOAD_OTHER = "Thermal Overload: Other"
+    * REBOOT_CAUSE_INSUFFICIENT_FAN_SPEED = "Insufficient Fan Speed"
+    * REBOOT_CAUSE_WATCHDOG = "Watchdog"
+    * REBOOT_CAUSE_HARDWARE_OTHER = "Hardware - Other"
+    * REBOOT_CAUSE_HARDWARE_BIOS = "BIOS"
+    * REBOOT_CAUSE_HARDWARE_CPU = "CPU"
+    * REBOOT_CAUSE_HARDWARE_BUTTON = "Push button"
+    * REBOOT_CAUSE_HARDWARE_RESET_FROM_ASIC = "Reset from ASIC"
+    * REBOOT_CAUSE_NON_HARDWARE = "Non-Hardware"
+* When the platform wants to provide additional details to the reboot cause they can append it to the string with a ',' separation as shown below.
+```
+return REBOOT_CAUSE_NON_HARDWARE + ', ' + 'kernel panic'
+```
+* The switch reboot use case will follow the same sequence.
+* The pmon container restart should not affect this sequence as the states are persisted either in the DB or in the file system.
+
+#### Schema for REBOOT_CAUSE of DPUs on switch ChassisStateDB
+```
+  Key: "REBOOT_CAUSE|DPU0|2024_06_06_09_31_18"
+
+  "REBOOT_CAUSE|DPU0|2024_06_06_09_31_18": {
+    "value": {
+      "cause": "Software causes (Reboot)",
+      "comment": "User issued 'reboot' command [User: admin, Time: Thu Jun  6 09:46:43 AM UTC 2024]",
+      "device": "DPU0",
+      "time": "N/A",
+      "user": "N/A"
+    }
+  }
 
 ```
-2. Though the get_oper_status(self) can get the operational status of the DPU Modules, the current implementation only has limited capabilities.
-    * Can only state MODULE_STATUS_FAULT and can't show exactly where in the state progression the DPU failed. This is critical in fault isolation, DPU switchover decision, resiliency and recovery
+#### 2. DPU State
+    * Added supporting fields such as "time" and "reason" to show exactly where in the state progression the DPU failed. This will be helpful in fault isolation, DPU switchover decision, resiliency and recovery
     * Though this is platform implementation specific, in a multi vendor use case, there has to be a consistent way of storing and accessing the information.
     * Store the state progression (dpu_midplane_link_state, dpu_control_plane_state, dpu_data_plane_state) on the host ChassisStateDB.
     * get_state_info(self) will return an object with the ChassisStateDB data
+    * Two more APIs, get_dataplane_state(self) and get_controlplane_state(self), are available to access the dataplane_state and controlplane_state individually.
+    * The dpu_midplane_link_state will be monitored and updated by the NPU PMON chassisd.
     * Potential consumers: HA, LB, Switch CLIs, Utils (install/repair images), Life Cycle Manager 
     * Use cases: HA, Debuggability, error recovery (reset, power cycle) and fault management, consolidated view of Switch and DPU state
+
 #### DPU_STATE definition
 dpu_midplane_link_state: up refers to the pcie link between the NPU and DPU is operational. This will be updated by the switch pcied.
 
@@ -490,13 +561,40 @@ dpu_data_plane_state: up  refers to configuration downloaded, the pipeline stage
         ”dpu_data_plane_time": ”timestamp",
         ”dpu_data_plane_reason": ”Pipeline failure",
 ```
-
-3. Each DPU has to store the health data in its local DB and should provide it to the switch.
-* When the "show system-health ..." CLI is executed on the switch, the "UserDefinedChecker" class will collect the data and feed it to the CLI. It is up to the platform on how this is done.  However, for faster access store it in the switch ChassisStateDB.
-* The DPU is a complex hardware, to facilitate debug, a consistent way of storing and accessing the health record of the DPUs is critical in a multi vendor scenario even though it is a platform specific implementation.
-* Both switch and the DPUs will follow to the [SONiC system health monitor HLD](https://github.com/sonic-net/SONiC/blob/ce313db92a694e007a6c5332ce3267ac158290f6/doc/system_health_monitoring/system-health-HLD.md)
+#### 3 DPU Health
+This feature is implemented in two phases.
+#### Phase:1
+* Each DPU has to store the health info locally and should be available on the DPU when the "show system-health ..." CLI is executed on the DPU just like the switch.
+#### Phase:2
+* Each DPU besides storing the health info locally, should also store the DPU health info in the switch ChassisStateDB. The schema for each DPU health info is the same as the switch and also is shown below.
+* When the "show system-health <all/DPUx/SWITCH>" CLI is executed on the switch a consolidated view of the entire system health will be provided.
+* The DPU is a complex hardware. To facilitate debug, a consistent way of storing and accessing the health record of the DPUs is critical in a multi vendor scenario even though it is a platform specific implementation.
+* Both switch and the DPUs will follow the [SONiC system health monitor HLD](https://github.com/sonic-net/SONiC/blob/ce313db92a694e007a6c5332ce3267ac158290f6/doc/system_health_monitoring/system-health-HLD.md)
 * Refer to section 3.4.5 for "show system-health .." CLIs
 
+#### Schema for HEALTH_INFO of DPUs on switch ChassisStateDB
+```
+; Defines information for a system health
+key                     = SYSTEM_HEALTH_INFO|DPUx        ; health information for DPUx
+; field                 = value
+summary                 = STRING                         ; summary status for the DPU
+<item_name>             = STRING                         ; an entry for a service or device
+
+```
+We store items to db only if it is abnormal. Here is an example:
+```
+admin@sonic:~$ redis-cli -n 13 hgetall SYSTEM_HEALTH_INFO
+1) "lldp:lldpmgrd"
+2) "Process 'lldpmgrd' in container 'lldp' is not running"
+3) "summary"
+4) "Not OK"
+```
+If the system status is good, the data in redis is like:
+```
+admin@sonic:~$ redis-cli -n 13 hgetall SYSTEM_HEALTH_INFO
+ 1) "summary"
+ 2) "OK"
+```
 ##### 3.1.5.2 ModuleBase class new APIs
 The DPU ID is used only for indexing purpose.
 
@@ -505,8 +603,7 @@ get_dpu_id(self):
     Retrieves the DPU ID. Returns None for non-smartswitch chassis.
 
     Returns:
-        An integer, indicating the DPU ID. DPU0 returns 1, DPUX returns X+1
-        Returns '0' on switch module
+        An integer, indicating the DPU ID. DPU0 returns 0, DPUX returns X
 ```
 #### Get DPU reboot cause
 def get_reboot_cause(self):
@@ -530,52 +627,17 @@ get_state_info(self):
 ```
 
 #### DPU_HEALTH Use Case
-* The major consumer of this data could be CLIs, fault management, debug, error recovery 
-
-get_health_info(self):
-```
-    Retrieves the dpu health object having the detailed dpu health Fetched from the DPUs
-
-    Returns:
-        An object instance of the dpu health. 
-        Returns None when the module is SWITCH
-    
-    Example:
-    {
-      "led_status": "green",
-
-      "monitoredlists": {
-          "Program": [
-              {"Name": "routeCheck", "Status": "Not OK", "Type": "Program"},
-              // Add more program items here
-          ],
-          "Service": [
-              {"Name": "mgmt-framework", "Status": "Not OK", "Type": "Service"},
-              // Add more service items here
-          ],
-          "Fan": [
-              {"Name": "Fan", "Status": "Not OK", "Type": "Fan"}
-          ],
-          "UserDefined": [
-              // Add user-defined items here
-          ]
-      },
-
-      "ignore_list": [
-          {"Name": "example1", "Status": "OK", "Type": "Type1"},
-          // Add more items to ignore list
-      ]
-    }
-```
+* The major consumer of this data could be CLIs, fault management, debug, error recovery.  There is no platform API for this.
 
 ### 3.2 Thermal management
 * Platform  initializes all sensors
 * Thermalctld fetch CPU temperature, DPU temperature, fan speed, monitor and update the DB
+* The thermal management runs on NPU
 * Thermal manager reads all thermal sensor data, run thermal policy and take policy action Ex. Set fan speed, set alarm, set syslog, set LEDs 
 * Platform collects fan related data such as presence, failure and then applies fan algorithm to set the new fan speed
 * The north bound CLI/Utils/App use DB data to ”show environment”, ”show platform temp” show platform fan”
-* The DPUs will update the ChassisStateDB "TEMPERATURE_INFO" tables through redis client call which in turn will be pushed into the switch StateDB.
 * The existing "TEMPERATURE_INFO" schema will be used to store the values and is shown below for convenience.
+
 #### TEMPERATURE_INFO schema in StateDB
 ```
   "TEMPERATURE_INFO|DPU_0_T": {
@@ -606,6 +668,8 @@ A typical modular chassis includes a midplane-interface to interconnect the Supe
 * By default smartswitch midplane IP address assignment will be done using internal DHCP.
 * Please refer to the [ip-address-assignment document](https://github.com/sonic-net/SONiC/blob/master/doc/smart-switch/ip-address-assigment/smart-switch-ip-address-assignment.md) for IP address assignment between the switch host and the DPUs.
 * The second option is the static IP address assignment.
+* A DPU state change handler will be implemented to monitor PCIe link state change events, DPU control-plane and data-plane state transitions mainly for HA.
+* There will be a separate hld for the DPU state change handler.
 
 ### 3.4 Debug & RMA
 CLI Extensions and Additions
@@ -676,92 +740,106 @@ fantray0    N/A  fantray0.fan      55%       intake     Present        OK  20230
 fantray1    N/A  fantray1.fan      56%       intake     Present        OK  20230728 06:41:17
 ```
 
-#### 3.4.1 Reboot Cause
-* There are two CLIs "show reboot-cause" and "show reboot-cause history" which are applicable to both DPUs and the Switch. However, when executed on the Switch the CLIs provide a consolidated view of reboot cause as shown below.
-* Each DPU will update its reboot cause history in the Switch ChasissStateDB upon boot up. The recent reboot-cause can be derived from that list of reboot-causes.
-* The switch side PMON will copy this into the stateDB so that the existing workflow will not be affected.
-* The get_reboot_cause API will return the current reboot-cause of the module.
-
-#### REBOOT_CAUSE DB schema
-```
-Key: "REBOOT_CAUSE|2023_06_18_14_56_12"
+#### 3.4.1 Reboot Cause CLIs
+* There are two existing CLIs "show reboot-cause" and "show reboot-cause history"
+* These two CLIs are extended to "show reboot-cause all" and "show reboot-cause history \<option\>", where the "option" could be DPUx, all or SWITCH
+* The DPUs will limit the number of history entries to a maximum of ten.
+* The recent reboot-cause can be derived from that list of reboot-causes.
+* Platform hardware should have the DPU reboot-cause available on the NPU side and provide it to the "get_reboot_cause()" API
 
-"REBOOT_CAUSE|2023_06_18_14_56_12": {
-    "value": {
-        "cause": "REBOOT_CAUSE_HOST_RESET_DPU",
-        "comment": "N/A",
-        "device": "DPU5",
-        "time": "2023_06_18_14_56_12",
-        "user": "N/A"
-    }
-}
-```
 #### 3.4.2 Reboot Cause CLIs on the DPUs      <font>**`Executed on the DPU`**</font>
 * The "show reboot-cause" shows the most recent reboot-cause
 * The "show reboot-cause history" shows the reboot-cause history
+* The new cli extensions will not have any effect on the DPUs as shown in the example.
 ```
-root@sonic:~#show reboot-cause
-
-Name                    Cause                       Time                                User    Comment
+root@sonic:~#show reboot-cause
 
-2023_10_02_17_20_46     reboot                      Sun 02 Oct 2023 05:20:46 PM UTC     admin   User issued 'reboot'
+Hardware - Other (NPU side powercycle)
 
-root@sonic:~#show reboot-cause history
+root@sonic:~#show reboot-cause history
 
-Name                    Cause                       Time                                User    Comment
+Name                 Cause                                   Time    User    Comment
+2024_11_12_16_09_41  Hardware - Other (NPU side powercycle)  N/A     N/A     Unknown
+2024_11_12_02_03_12  Hardware - Other (NPU side powercycle)  N/A     N/A     Unknown
 
-2023_10_02_17_20_46     reboot                      Sun 02 Oct 2023 05:20:46 PM UTC     admin   User issued 'reboot'
-2023_10_02_18_10_00     reboot                      Sun 02 Oct 2023 06:10:00 PM UTC     admin   User issued 'reboot'
+root@sonic:~#show reboot-cause all
+root@sonic:~#show reboot-cause history all
+root@sonic:~#show reboot-cause history DPU0
 ```
+
 #### 3.4.3 Reboot Cause CLIs on the Switch      <font>**`Executed on the switch`**</font>
-* The "show reboot-cause" CLI on the switch shows the most recent rebooted device, time and the cause. The could be the NPU or any DPU
-* The "show reboot-cause history" CLI on the switch shows the history of the Switch and all DPUs
-* The "show reboot-cause history module-name" CLI on the switch shows the history of the specified module
+* The "show reboot-cause" CLI on the switch remains the same.
+* The "show reboot-cause all" CLI on the switch shows the recent reboot-cause of the Switch and the DPUs.
+* The "show reboot-cause history" CLI on the switch shows the history of the smartswitch and is the same as any switch.
+* The "show reboot-cause history \<option\>" CLI on the switch shows the history of the specified module depending on the option as shown below.
 
-"show reboot-cause history"      <font>**`Executed on the switch`**</font>
 ```
-root@sonic:~#show reboot-cause
+root@sonic:~#show reboot-cause
+
+Power Loss
+
+root@sonic:~#show reboot-cause history
+
+Name                    Cause                       Time                                User    Comment
+-------------------     -------------------         -------------------------------     ------  ------
+2023_10_20_18_52_28     Watchdog:1 expired;         Wed 20 Oct 2023 06:52:28 PM UTC     N/A     N/A
+2023_10_05_18_23_46     reboot                      Wed 05 Oct 2023 06:23:46 PM UTC     user    N/A
+
 
-Device          Name                    Cause                       Time                                User    Comment
+root@sonic:~#show reboot-cause all
 
-switch          2023_10_20_18_52_28     Watchdog:1 expired;         Wed 20 Oct 2023 06:52:28 PM UTC     N/A     N/A
-DPU3            2023_10_03_18_23_46     Watchdog: stage 1 expired;  Mon 03 Oct 2023 06:23:46 PM UTC     N/A     N/A
-DPU2            2023_10_02_17_20_46     reboot                      Sun 02 Oct 2023 05:20:46 PM UTC     admin   User issued 'reboot'
+Device    Name                 Cause                                   Time                             User
+--------  -------------------  --------------------------------------  -------------------------------  ------
+SWITCH    2024_11_12_02_03_08  Power Loss                              N/A                              N/A
+DPU3      2024_11_12_02_06_01  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:06:01 AM UTC 2024  N/A
+DPU2      2024_11_12_02_05_58  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:05:58 AM UTC 2024  N/A
+DPU1      2024_11_12_02_05_55  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:05:55 AM UTC 2024  N/A
+DPU0      2024_11_12_16_08_43  Non-Hardware, Switch rebooted DPU       Tue Nov 12 04:08:43 PM UTC 2024  N/A
 
-root@sonic:~#show reboot-cause history
 
-Device          Name                    Cause                       Time                                User    Comment
+root@sonic:~# show reboot-cause history all
+Device    Name                 Cause                                   Time                             User    Comment
+--------  -------------------  --------------------------------------  -------------------------------  ------  ------------------------------------------------------------------------
+SWITCH    2024_11_12_02_03_08  Power Loss                              N/A                              N/A     Unknown (First boot of SONiC version master.18096-dirty-20241111.203125)
+DPU3      2024_11_12_02_06_01  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:06:01 AM UTC 2024          N/A
+DPU2      2024_11_12_02_05_58  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:05:58 AM UTC 2024          N/A
+DPU1      2024_11_12_02_05_55  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:05:55 AM UTC 2024          N/A
+DPU0      2024_11_12_16_08_43  Non-Hardware, Switch rebooted DPU       Tue Nov 12 04:08:43 PM UTC 2024          N/A
+DPU0      2024_11_12_02_05_52  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:05:52 AM UTC 2024          N/A
 
-switch          2023_10_20_18_52_28     Watchdog:1 expired;         Wed 20 Oct 2023 06:52:28 PM UTC     N/A     N/A
-switch          2023_10_05_18_23_46     reboot                      Wed 05 Oct 2023 06:23:46 PM UTC     user    N/A
-DPU3            2023_10_03_18_23_46     Watchdog: stage 1 expired;  Mon 03 Oct 2023 06:23:46 PM UTC     N/A     N/A
-DPU3            2023_10_02_18_23_46     Host Power-cycle            Sun 02 Oct 2023 06:23:46 PM UTC     N/A     Host lost DPU
-DPU3            2023_10_02_17_23_46     Host Reset DPU              Sun 02 Oct 2023 05:23:46 PM UTC     N/A     N/A
-DPU2            2023_10_02_17_20_46     reboot                      Sun 02 Oct 2023 05:20:46 PM UTC     admin   User issued 'reboot'
 
-"show reboot-cause history module-name"
+root@sonic:~# show reboot-cause history DPU0
+Device    Name                 Cause                                   Time                             User    Comment
+--------  -------------------  --------------------------------------  -------------------------------  ------  ---------
+DPU0      2024_11_12_16_08_43  Non-Hardware, Switch rebooted DPU       Tue Nov 12 04:08:43 PM UTC 2024          N/A
+DPU0      2024_11_12_02_05_52  Hardware - Other (NPU side powercycle)  Tue Nov 12 02:05:52 AM UTC 2024          N/A
 
-root@sonic:~#show reboot-cause history dpu3
 
-Device      Name                    Cause                           Time                                User    Comment 
-   
-DPU3        2023_10_03_18_23_46     Watchdog: stage 1 expired;      Mon 03 Oct 2023 06:23:46 PM UTC     N/A     N/A
-DPU3        2023_10_02_18_23_46     Host Power-cycle                Sun 02 Oct 2023 06:23:46 PM UTC     N/A     Host lost DPU
-DPU3        2023_10_02_17_23_46     Host Reset DPU                  Sun 02 Oct 2023 05:23:46 PM UTC     N/A     N/A
+root@sonic:~# show reboot-cause history SWITCH
+Device    Name                 Cause         Time    User    Comment
+--------  -------------------  ------------  ------  ------  ------------------------------------------------------------------------
+SWITCH    2024_11_12_02_03_08  Power Loss     N/A    N/A     Unknown (First boot of SONiC version master.18096-dirty-20241111.203125)
 ```
+
 #### 3.4.4 Chassis Module Status
 * The "show chassis modules status" is an existing CLI but extended to include the status of all DPUs and switch. <font>**`Executed on the switch. This CLI is not available on the DPU.`**</font>
 ```
-root@sonic:~#show chassis modules status                                                                                      
-Name        Description         ID         Oper-Status     Admin-Status     Serial
-
-DPU0        SS-DPU0             1           Online          up              SN20240105
-DPU1        SS-DPU1             2           Online          up              SN20240102
-...
-SWITCH      Chassis             0           Online          N/A             FLM27000ER
+root@sonic:~#show chassis modules status
+  Name    Description    Physical-Slot    Oper-Status    Admin-Status    Serial
+------  -------------  ---------------  -------------  --------------  --------
+  DPU0            N/A              N/A        Offline            down       N/A
+  DPU1            N/A              N/A         Online              up       N/A
+  DPU2            N/A              N/A         Online              up       N/A
+  DPU3            N/A              N/A         Online              up       N/A
 ```
+
 #### 3.4.5  System health details
-* The system health summary on NPU should include the DPU health. Extend the existing infrastructure.
+#### Phase:1
+* The system health summary on switch will display only the NPU health
+* The system health summary on DPU will display the DPU health
+
+#### Phase:2
+* The system health summary on switch should include the NPU and DPU health. Extend the existing CLI infrastructure.
 
 show system-health summary \<module-name\>   <font>**`Executed on the switch or DPU - module-name is ignored on the DPUs`**</font>
 ```
@@ -796,27 +874,27 @@ When the idex is "all" shows the detailed state of all DPUs
 Oper-Status definition: 
 Online : All states are up
 Offline: dpu_midplane_link_state is down
-Partial Online: dpu_midplane_link_state is up and dpu_control_plane_state or dpu_data_plane_state is down
+Fault: dpu_midplane_link_state is up and dpu_control_plane_state or dpu_data_plane_state is down
+
+There are two parts to the state detail. 1. The midplane state 2. the dpu states (control plane state, data plane state). The midplane state has to be updated by the switch side pcied. The dpu states will be updated by the DPU (redis client update) on the switch ChassisStateDB. The get_state_info() API in the moduleBase class will fetch the contents from the DB. The show CLI reads the redis table and displays the data.
+root@sonic:~#show system-health DPU all
 
-There are two parts to the state detail. 1. The midplane state 2. the dpu states (booted, control plane state, data plane state). The midplane state has to be updated by the switch side pcied. The dpu states will be updated by the DPU (redis client update) on the switch ChassisStateDB. The get_state_info() API in the moduleBase class will fetch the contents from the DB. The show CLI reads the redis table and displays the data.
-root@sonic:~#show system-health DPU all  
-            
-Name       ID    Oper-Status          State-Detail                   State-Value     Time                               Reason                        
-DPU0       1     Partial Online       dpu_midplane_link_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
-                                      dpu_control_plane_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
-                                      dpu_data_plane_state           down            Wed 20 Oct 2023 06:52:28 PM UTC    Pipeline failure
+Name       Oper-Status          State-Detail                   State-Value     Time                               Reason                        
+DPU0       Fault                dpu_midplane_link_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
+                                dpu_control_plane_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
+                                dpu_data_plane_state           down            Wed 20 Oct 2023 06:52:28 PM UTC    Pipeline failure
 
 
-DPU1       2     Online               dpu_midplane_link_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
-                                      dpu_control_plane_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
-                                      dpu_data_plane_state           up              Wed 20 Oct 2023 06:52:28 PM UTC
+DPU1       Online               dpu_midplane_link_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
+                                dpu_control_plane_state        up              Wed 20 Oct 2023 06:52:28 PM UTC
+                                dpu_data_plane_state           up              Wed 20 Oct 2023 06:52:28 PM UTC
 
 root@sonic:~#show system-health DPU 0
- 
-Name       ID    Oper-Status          State-Detail                   State-Value     Time                               Reason
-DPU0       1     Offline              dpu_midplane_link_state        down            Wed 20 Oct 2023 06:52:28 PM UTC    PCIe link is down
-                                      dpu_control_plane_state        down            Wed 20 Oct 2023 06:52:28 PM UTC
-                                      dpu_data_plane_state           down            Wed 20 Oct 2023 06:52:28 PM UTC
+
+Name       Oper-Status          State-Detail                   State-Value     Time                               Reason
+DPU0       Offline              dpu_midplane_link_state        down            Wed 20 Oct 2023 06:52:28 PM UTC    PCIe link is down
+                                dpu_control_plane_state        down            Wed 20 Oct 2023 06:52:28 PM UTC
+                                dpu_data_plane_state           down            Wed 20 Oct 2023 06:52:28 PM UTC
 ```
 #### System health cli extended further as shown
  * Detailed output from the switch can be obtained with the following CLI
@@ -943,7 +1021,25 @@ CPU                        OK        UserDefine
 DDR                        OK        UserDefine
 ```
 
-show interface status - will show the NPU-DPU interface status also      <font>**`Executed on the switch`**</font>
+show interface status - will show the NPU-DPU dataplane interface status also      <font>**`Executed on the switch`**</font>
+
+The internal DPU ports use "role" type in PORT config to indicate NPU-DPU Data Port Type as shown here. Check the type for "Ethernet224" in the "show interface status" output. This config is part of hwsku.json file.
+```
+{
+    "PORT": {
+        "Ethernet224": {
+            "lanes": "2828,2829,2830,2831",
+            "alias": "dpu-0",
+            "index": "28",
+            "speed": "200000",
+            "subport": "0",
+            "admin_status": "up",
+            "mtu": "9100",
+            "role": "Dpc"
+        },
+    }
+}
+```
 ```
 root@sonic:~# show interfaces status
   Interface                                    Lanes    Speed    MTU    FEC    Alias    Vlan    Oper    Admin    Type       Asym PFC
@@ -954,16 +1050,14 @@ root@sonic:~# show interfaces status
  Ethernet24  2048,2049,2050,2051,2052,2053,2054,2055     400G   9100    N/A     etp3  routed    down       up     N/A           N/A
  Ethernet32  1792,1793,1794,1795,1796,1797,1798,1799     400G   9100    N/A     etp4  routed    down       up     N/A           N/A
  Ethernet40  1800,1801,1802,1803,1804,1805,1806,1807     400G   9100    N/A     etp5  routed    down       up     N/A           N/A
- ...
- ...
-
-### These are internal DPU ports.  Use role type to indicate NPU-DPU Data Port.###
 ...
 ...
-Ethernet192                                   4,5,6,7     200G   9100    N/A   dpu-0  routed    down       up     DPU-NPU Data Port  N/A
-Ethernet200                                   0,1,2,3     200G   9100    N/A   dpu-1  routed    down       up     DPU-NPU Data Port  N/A
-Ethernet208                                 8,9,10,11     200G   9100    N/A   dpu-2  routed    down       up     DPU-NPU Data Port  N/A
-Ethernet216                               12,13,14,15     200G   9100    N/A   dpu-3  routed    down       up     DPU-NPU Data Port  N/A
+...
+...
+Ethernet224                                   4,5,6,7     200G   9100    N/A   dpu-0  routed    down       up     Dpc  N/A
+Ethernet232                                   0,1,2,3     200G   9100    N/A   dpu-1  routed    down       up     Dpc  N/A
+Ethernet240                                 8,9,10,11     200G   9100    N/A   dpu-2  routed    down       up     Dpc  N/A
+Ethernet248                               12,13,14,15     200G   9100    N/A   dpu-3  routed    down       up     Dpc  N/A
 ```
 
 show interface status     <font>**`Executed on the DPU`**</font>
@@ -976,7 +1070,67 @@ root@sonic:/home/admin# show interfaces status
 ### 3.5 Console Management
 The console access to smartswitch needs to support DPU access in addition to the switch.
 * By default the management port should be connected to the switch CPU console
-* Once inside the switch, the DPUs should be accesssible from it. The design workflow for this will be covered in another document.
+* Once inside the switch, the DPUs should be accessible from it.
+
+#### 3.5.1 Dpu Console Utility
+* SONiC now supports a DPU console utility "dpu-tty.py"
+* The scope of this is limited to smartswitch platforms
+* The user can invoke one or more DPU consoles as shown below by invoking the script "dpu-tty.py" with the module name option "-n dpu0"
+
+```
+root@MtFuji:/home/cisco# dpu-tty.py -n dpu0
+picocom v3.1
+
+port is        : /dev/ttyS4
+flowcontrol    : none
+baudrate is    : 115200
+parity is      : none
+databits are   : 8
+stopbits are   : 1
+escape is      : C-a
+local echo is  : no
+noinit is      : no
+noreset is     : no
+hangup is      : no
+nolock is      : no
+send_cmd is    : sz -vv
+receive_cmd is : rz -vv -E
+imap is        : 
+omap is        : 
+emap is        : crcrlf,delbs,
+logfile is     : none
+initstring     : none
+exit_after is  : not set
+exit is        : no
+
+Type [C-a] [C-h] to see available commands
+Terminal ready
+
+sonic login: admin
+Password: 
+
+```
+#### 3.5.2 Dpu Console Configuration
+* The console configuration is provided via the platform.json file as shown
+* This file is responsible for selecting the baud rate and mapping the module name to the underlying TTY device name.
+```
+Sample platform.json configuration
+
+"DPUS": {
+    "dpu0": {
+        "serial-console": {
+            "device": "ttyS4",
+            "baud-rate": "115200"
+        }
+    },
+    "dpu1": {
+        "serial-console": {
+            "device": "ttyS5",
+            "baud-rate": "115200"
+        }
+    }
+},
+```
 
 ### 3.6 Firmware Upgrade
 * The fwutility should remain unchanged, but the vendor plugin should be extended to support the DPU FW upgrade.
@@ -1022,4 +1176,4 @@ Note:
 ```
 
 ## 4.   Test Plan
-In Progress
+[Test Plan](https://github.com/nissampa/sonic-mgmt_dpu_test/blob/dpu_test_plan_draft_pr/docs/testplan/Smartswitch-test-plan.md)