Ejemplo n.º 1
0
func job_verification_function() {
	//
	// Prevent jobs from accidental oversubscription
	//
	const intel_slots, amd_slots = 16, 64

	var modified_p bool = false
	if !jsv.JSV_is_param("pe_name") {
		jsv.JSV_set_param("binding_strategy", "linear_automatic")
		jsv.JSV_set_param("binding_type", "set")
		jsv.JSV_set_param("binding_amount", "1")
		jsv.JSV_set_param("binding_exp_n", "0")
		modified_p = true
	} else {
		hostlist, _ := jsv.JSV_get_param("q_hard")
		hostlist = strings.SplitAfterN(hostlist, "@", 2)[1]

		v, _ := jsv.JSV_get_param("pe_max")
		pe_max, _ := strconv.Atoi(v)

		if strings.EqualFold("@amdhosts", hostlist) {
			if pe_max > 127 {
				jsv.JSV_set_param("R", "y")
				modified_p = true
			}
		}

		if strings.EqualFold("@intelhosts", hostlist) {
			if pe_max > 31 {
				jsv.JSV_set_param("R", "y")
				modified_p = true
			}
		}
	}

	if modified_p {
		// jsv.JSV_show_params()
		jsv.JSV_correct("Job was modified")
	} else {
		jsv.JSV_correct("Job was not modified")
	}

	return
}
Ejemplo n.º 2
0
func job_verification_function() {

	//
	// Prevent jobs from accidental oversubscription
	//

	// NOTE
	// The submit(1) man page has slightly different terminology:
	// "binding_instance" in the man page is "binding_type" in
	//  the jsv library.
	const intel_slots, amd_slots = 16, 64

	var modified_p bool = false

	group, _ := jsv.JSV_get_param("GROUP")

	if !jsv.JSV_is_param("pe_name") {
		// no PE => serial job
		jsv.JSV_set_param("binding_strategy", "linear_automatic")
		jsv.JSV_set_param("binding_amount", "1")
		jsv.JSV_set_param("binding_type", "set")
		jsv.JSV_set_param("binding_exp_n", "0")
		modified_p = true
	} else {
		// parallel job
		if !jsv.JSV_is_param("binding_strategy") {

			pe_name, _ := jsv.JSV_get_param("pe_name")

			var v string
			v, _ = jsv.JSV_get_param("pe_max")
			pe_max, _ := strconv.Atoi(v)

			v, _ = jsv.JSV_get_param("pe_min")
			pe_min, _ := strconv.Atoi(v)

			if strings.EqualFold("shm", pe_name) && (pe_max == pe_min) {
				jsv.JSV_set_param("binding_strategy", "linear_automatic")
				jsv.JSV_set_param("binding_type", "pe")
				jsv.JSV_set_param("binding_amount", strconv.Itoa(pe_max))
				modified_p = true
			} else {

				l_hard, _ := jsv.JSV_get_param("l_hard")
				q_hard, _ := jsv.JSV_get_param("q_hard")

				singleat_re, _ := regexp.Compile("@[a-z]")
				doubleat_re, _ := regexp.Compile("@@")
				intelhost_re, _ := regexp.Compile("^ic[:digit:]{2}n[:digit:]{2}$")
				amdhost_re, _ := regexp.Compile("^ac[:digit:]{2}n[:digit:]{2}$")
				gpuhost_re, _ := regexp.Compile("^gpu[:digit:]{2}$")

				var q string
				var host string
				var hostlist string

				if singleat_re.MatchString(q_hard) {
					// we have a single host
					q = strings.Split(q_hard, "@")[0]
					host = strings.Split(q_hard, "@")[1]
				} else if doubleat_re.MatchString(q_hard) {
					// we have a hostgroup
					q = strings.Split(q_hard, "@")[0]
					hostlist = strings.SplitAfterN(q_hard, "@", 2)[1]
				} else {
					// we have no host specifier
					q = q_hard
				}

				cplx := make(map[string]string)
				l_hard_split := strings.Split(l_hard, ",")
				for _, v := range l_hard_split {
					cplx[strings.Split(v, "=")[0]] = strings.Split(v, "=")[1]
				}

				vendor, ok := cplx["vendor"]

				if !ok {
					// vendor was not requested by job
					if strings.EqualFold("gpu.q", q) || strings.EqualFold("@intelhosts", hostlist) {
						vendor = "intel"
					} else if strings.EqualFold("@amdhosts", hostlist) {
						vendor = "amd"
					} else if len(host) != 0 {
						// specific hosts requested
						if intelhost_re.MatchString(host) || gpuhost_re.MatchString(host) {
							vendor = "intel"
						} else if amdhost_re.MatchString(host) {
							vendor = "amd"
						}
					} else {
						_, ok = cplx["ngpus"]
						if !ok {
							_, ok = cplx["cuda"]
						}

						if ok {
							vendor = "intel"
						} else {
							vendor = "undef"
						}
					}
				}

				// Only specify binding if pe_max == pe_min, i.e. if a fixed
				// number of slots is requested

				if !strings.EqualFold("undef", vendor) && pe_max == pe_min {
					jsv.JSV_set_param("binding_strategy", "linear_automatic")
					jsv.JSV_set_param("binding_type", "pe")

					// Don't do reservation for high-throughput groups
					if !strings.EqualFold("rosenGrp", group) {
						if strings.EqualFold("intel", vendor) {
							if pe_max < intel_slots {
								jsv.JSV_set_param("binding_amount", strconv.Itoa(pe_max))
							} else {
								jsv.JSV_set_param("binding_amount", strconv.Itoa(intel_slots))
							}

							if pe_max > 31 {
								jsv.JSV_set_param("R", "y")
							}
						} else if strings.EqualFold("amd", vendor) {
							if pe_max < amd_slots {
								jsv.JSV_set_param("binding_amount", strconv.Itoa(pe_max))
							} else {
								jsv.JSV_set_param("binding_amount", strconv.Itoa(amd_slots))

								if pe_max > 127 {
									jsv.JSV_set_param("R", "y")
								}
							}
						}
					}

					modified_p = true
				}
			}
		}
	}

	// XXX print out debugging info - comment out for production
	jsv.JSV_show_params()

	if modified_p {
		jsv.JSV_correct("Job was modified")
	} else {
		jsv.JSV_correct("Job was not modified")
	}

	return
}