lenovo_fix.py 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838
  1. #!/usr/bin/env python3
  2. from __future__ import print_function
  3. import argparse
  4. import configparser
  5. import glob
  6. import gzip
  7. import os
  8. import re
  9. import struct
  10. import subprocess
  11. import sys
  12. from collections import defaultdict
  13. from datetime import datetime
  14. from errno import EACCES, EPERM
  15. from multiprocessing import cpu_count
  16. from platform import uname
  17. from threading import Event, Thread
  18. from time import time
  19. import dbus
  20. from dbus.mainloop.glib import DBusGMainLoop
  21. from gi.repository import GLib
  22. from mmio import MMIO, MMIOError
  23. DEFAULT_SYSFS_POWER_PATH = '/sys/class/power_supply/AC*/online'
  24. VOLTAGE_PLANES = {'CORE': 0, 'GPU': 1, 'CACHE': 2, 'UNCORE': 3, 'ANALOGIO': 4}
  25. CURRENT_PLANES = {'CORE': 0, 'GPU': 1, 'CACHE': 2}
  26. TRIP_TEMP_RANGE = [40, 97]
  27. UNDERVOLT_KEYS = ('UNDERVOLT', 'UNDERVOLT.AC', 'UNDERVOLT.BATTERY')
  28. ICCMAX_KEYS = ('ICCMAX', 'ICCMAX.AC', 'ICCMAX.BATTERY')
  29. power = {'source': None, 'method': 'polling'}
  30. HWP_VALUE = 0x20
  31. HWP_INTERVAL = 60
  32. platform_info_bits = {
  33. 'maximum_non_turbo_ratio': [8, 15],
  34. 'maximum_efficiency_ratio': [40, 47],
  35. 'minimum_operating_ratio': [48, 55],
  36. 'feature_ppin_cap': [23, 23],
  37. 'feature_programmable_turbo_ratio': [28, 28],
  38. 'feature_programmable_tdp_limit': [29, 29],
  39. 'number_of_additional_tdp_profiles': [33, 34],
  40. 'feature_programmable_temperature_target': [30, 30],
  41. 'feature_low_power_mode': [32, 32],
  42. }
  43. thermal_status_bits = {
  44. 'thermal_limit_status': [0, 0],
  45. 'thermal_limit_log': [1, 1],
  46. 'prochot_or_forcepr_status': [2, 2],
  47. 'prochot_or_forcepr_log': [3, 3],
  48. 'crit_temp_status': [4, 4],
  49. 'crit_temp_log': [5, 5],
  50. 'thermal_threshold1_status': [6, 6],
  51. 'thermal_threshold1_log': [7, 7],
  52. 'thermal_threshold2_status': [8, 8],
  53. 'thermal_threshold2_log': [9, 9],
  54. 'power_limit_status': [10, 10],
  55. 'power_limit_log': [11, 11],
  56. 'current_limit_status': [12, 12],
  57. 'current_limit_log': [13, 13],
  58. 'cross_domain_limit_status': [14, 14],
  59. 'cross_domain_limit_log': [15, 15],
  60. 'cpu_temp': [16, 22],
  61. 'temp_resolution': [27, 30],
  62. 'reading_valid': [31, 31],
  63. }
  64. supported_cpus = {
  65. 'Haswell': (0x3C, 0x3F, 0x45, 0x46),
  66. 'Broadwell': (0x3D, 0x47, 0x4F, 0x56),
  67. 'Skylake': (0x4E, 0x55),
  68. 'Skylake-S': (0x5E,),
  69. 'Ice Lake': (0x7E,),
  70. 'Kaby Lake (R)': (0x8E, 0x9E),
  71. 'Coffee Lake': (0x9E,),
  72. 'Cannon Lake': (0x66,),
  73. }
  74. class bcolors:
  75. YELLOW = '\033[93m'
  76. GREEN = '\033[92m'
  77. RED = '\033[91m'
  78. RESET = '\033[0m'
  79. BOLD = '\033[1m'
  80. OK = bcolors.GREEN + bcolors.BOLD + 'OK' + bcolors.RESET
  81. ERR = bcolors.RED + bcolors.BOLD + 'ERR' + bcolors.RESET
  82. LIM = bcolors.YELLOW + bcolors.BOLD + 'LIM' + bcolors.RESET
  83. log_history = set()
  84. def log(msg, oneshot=False, end='\n'):
  85. outfile = args.log if args.log else sys.stdout
  86. if msg.strip() not in log_history or oneshot is False:
  87. tstamp = datetime.now().strftime('%Y-%m-%d %H:%M:%S.%f')[:-3]
  88. full_msg = '{:s}: {:s}'.format(tstamp, msg) if args.log else msg
  89. print(full_msg, file=outfile, end=end)
  90. log_history.add(msg.strip())
  91. def fatal(msg, code=1, end='\n'):
  92. outfile = args.log if args.log else sys.stderr
  93. tstamp = datetime.now().strftime('%Y-%m-%d %H:%M:%S.%f')[:-3]
  94. full_msg = '{:s}: [E] {:s}'.format(tstamp, msg) if args.log else '[E] {:s}'.format(msg)
  95. print(full_msg, file=outfile, end=end)
  96. sys.exit(code)
  97. def warning(msg, oneshot=True, end='\n'):
  98. outfile = args.log if args.log else sys.stderr
  99. if msg.strip() not in log_history or oneshot is False:
  100. tstamp = datetime.now().strftime('%Y-%m-%d %H:%M:%S.%f')[:-3]
  101. full_msg = '{:s}: [W] {:s}'.format(tstamp, msg) if args.log else '[W] {:s}'.format(msg)
  102. print(full_msg, file=outfile, end=end)
  103. log_history.add(msg.strip())
  104. def writemsr(msr, val):
  105. msr_list = ['/dev/cpu/{:d}/msr'.format(x) for x in range(cpu_count())]
  106. if not os.path.exists(msr_list[0]):
  107. try:
  108. subprocess.check_call(('modprobe', 'msr'))
  109. except subprocess.CalledProcessError:
  110. fatal('Unable to load the msr module.')
  111. try:
  112. for addr in msr_list:
  113. f = os.open(addr, os.O_WRONLY)
  114. os.lseek(f, msr, os.SEEK_SET)
  115. os.write(f, struct.pack('Q', val))
  116. os.close(f)
  117. except (IOError, OSError) as e:
  118. if e.errno == EPERM or e.errno == EACCES:
  119. fatal(
  120. 'Unable to write to MSR. Try to disable Secure Boot '
  121. 'and check if your kernel does not restrict access to MSR.'
  122. )
  123. else:
  124. raise e
  125. # returns the value between from_bit and to_bit as unsigned long
  126. def readmsr(msr, from_bit=0, to_bit=63, cpu=None, flatten=False):
  127. assert cpu is None or cpu in range(cpu_count())
  128. if from_bit > to_bit:
  129. fatal('Wrong readmsr bit params')
  130. msr_list = ['/dev/cpu/{:d}/msr'.format(x) for x in range(cpu_count())]
  131. if not os.path.exists(msr_list[0]):
  132. try:
  133. subprocess.check_call(('modprobe', 'msr'))
  134. except subprocess.CalledProcessError:
  135. fatal('Unable to load the msr module.')
  136. try:
  137. output = []
  138. for addr in msr_list:
  139. f = os.open(addr, os.O_RDONLY)
  140. os.lseek(f, msr, os.SEEK_SET)
  141. val = struct.unpack('Q', os.read(f, 8))[0]
  142. os.close(f)
  143. output.append(get_value_for_bits(val, from_bit, to_bit))
  144. if flatten:
  145. return output[0] if len(set(output)) == 1 else output
  146. return output[cpu] if cpu is not None else output
  147. except (IOError, OSError) as e:
  148. if e.errno == EPERM or e.errno == EACCES:
  149. fatal('Unable to read from MSR. Try to disable Secure Boot.')
  150. else:
  151. raise e
  152. def get_value_for_bits(val, from_bit=0, to_bit=63):
  153. mask = sum(2 ** x for x in range(from_bit, to_bit + 1))
  154. return (val & mask) >> from_bit
  155. def is_on_battery(config):
  156. try:
  157. for path in glob.glob(config.get('GENERAL', 'Sysfs_Power_Path', fallback=DEFAULT_SYSFS_POWER_PATH)):
  158. with open(path) as f:
  159. return not bool(int(f.read()))
  160. raise
  161. except:
  162. warning('No valid Sysfs_Power_Path found! Trying upower method #1')
  163. try:
  164. out = subprocess.check_output(('upower', '-i', '/org/freedesktop/UPower/devices/line_power_AC'))
  165. res = re.search(rb'online:\s+(yes|no)', out).group(1).decode().strip()
  166. if res == 'yes':
  167. return False
  168. elif res == 'no':
  169. return True
  170. raise
  171. except:
  172. warning('Trying upower method #2')
  173. try:
  174. out = subprocess.check_output(('upower', '-i', '/org/freedesktop/UPower/devices/battery_BAT0'))
  175. res = re.search(rb'state:\s+(.+)', out).group(1).decode().strip()
  176. if res == 'discharging':
  177. return True
  178. elif res in ('fully-charged', 'charging'):
  179. return False
  180. except:
  181. pass
  182. warning('No valid power detection methods found. Assuming that the system is running on battery power.')
  183. return True
  184. def get_cpu_platform_info():
  185. features_msr_value = readmsr(0xCE, cpu=0)
  186. cpu_platform_info = {}
  187. for key, value in platform_info_bits.items():
  188. cpu_platform_info[key] = int(get_value_for_bits(features_msr_value, value[0], value[1]))
  189. return cpu_platform_info
  190. def get_reset_thermal_status():
  191. # read thermal status
  192. thermal_status_msr_value = readmsr(0x19C)
  193. thermal_status = []
  194. for core in range(cpu_count()):
  195. thermal_status_core = {}
  196. for key, value in thermal_status_bits.items():
  197. thermal_status_core[key] = int(get_value_for_bits(thermal_status_msr_value[core], value[0], value[1]))
  198. thermal_status.append(thermal_status_core)
  199. # reset log bits
  200. writemsr(0x19C, 0)
  201. return thermal_status
  202. def get_time_unit():
  203. # 0.000977 is the time unit of my CPU
  204. # TODO formula might be different for other CPUs
  205. return 1.0 / 2 ** readmsr(0x606, 16, 19, cpu=0)
  206. def get_power_unit():
  207. # 0.125 is the power unit of my CPU
  208. # TODO formula might be different for other CPUs
  209. return 1.0 / 2 ** readmsr(0x606, 0, 3, cpu=0)
  210. def get_critical_temp():
  211. # the critical temperature for my CPU is 100 'C
  212. return readmsr(0x1A2, 16, 23, cpu=0)
  213. def get_cur_pkg_power_limits():
  214. value = readmsr(0x610, 0, 55, flatten=True)
  215. return {
  216. 'PL1': get_value_for_bits(value, 0, 14),
  217. 'TW1': get_value_for_bits(value, 17, 23),
  218. 'PL2': get_value_for_bits(value, 32, 46),
  219. 'TW2': get_value_for_bits(value, 49, 55),
  220. }
  221. def calc_time_window_vars(t):
  222. time_unit = get_time_unit()
  223. for Y in range(2 ** 5):
  224. for Z in range(2 ** 2):
  225. if t <= (2 ** Y) * (1.0 + Z / 4.0) * time_unit:
  226. return (Y, Z)
  227. raise ValueError('Unable to find a good combination!')
  228. def calc_undervolt_msr(plane, offset):
  229. """Return the value to be written in the MSR 150h for setting the given
  230. offset voltage (in mV) to the given voltage plane.
  231. """
  232. assert offset <= 0
  233. assert plane in VOLTAGE_PLANES
  234. offset = int(round(offset * 1.024))
  235. offset = 0xFFE00000 & ((offset & 0xFFF) << 21)
  236. return 0x8000001100000000 | (VOLTAGE_PLANES[plane] << 40) | offset
  237. def calc_undervolt_mv(msr_value):
  238. """Return the offset voltage (in mV) from the given raw MSR 150h value.
  239. """
  240. offset = (msr_value & 0xFFE00000) >> 21
  241. offset = offset if offset <= 0x400 else -(0x800 - offset)
  242. return int(round(offset / 1.024))
  243. def get_undervolt(plane=None, convert=False):
  244. planes = [plane] if plane in VOLTAGE_PLANES else VOLTAGE_PLANES
  245. out = {}
  246. for plane in planes:
  247. writemsr(0x150, 0x8000001000000000 | (VOLTAGE_PLANES[plane] << 40))
  248. read_value = readmsr(0x150, flatten=True) & 0xFFFFFFFF
  249. out[plane] = calc_undervolt_mv(read_value) if convert else read_value
  250. return out
  251. def undervolt(config):
  252. for plane in VOLTAGE_PLANES:
  253. write_offset_mv = config.getfloat(
  254. 'UNDERVOLT.{:s}'.format(power['source']), plane, fallback=config.getfloat('UNDERVOLT', plane, fallback=0.0)
  255. )
  256. write_value = calc_undervolt_msr(plane, write_offset_mv)
  257. writemsr(0x150, write_value)
  258. if args.debug:
  259. write_value &= 0xFFFFFFFF
  260. read_value = get_undervolt(plane)[plane]
  261. read_offset_mv = calc_undervolt_mv(read_value)
  262. match = OK if write_value == read_value else ERR
  263. log(
  264. '[D] Undervolt plane {:s} - write {:.0f} mV ({:#x}) - read {:.0f} mV ({:#x}) - match {}'.format(
  265. plane, write_offset_mv, write_value, read_offset_mv, read_value, match
  266. )
  267. )
  268. def calc_icc_max_msr(plane, current):
  269. """Return the value to be written in the MSR 150h for setting the given
  270. IccMax (in A) to the given current plane.
  271. """
  272. assert 0 < current <= 0x3FF
  273. assert plane in CURRENT_PLANES
  274. current = int(round(current * 4))
  275. return 0x8000001700000000 | (CURRENT_PLANES[plane] << 40) | current
  276. def calc_icc_max_amp(msr_value):
  277. """Return the max current (in A) from the given raw MSR 150h value.
  278. """
  279. return (msr_value & 0x3FF) / 4.0
  280. def get_icc_max(plane=None, convert=False):
  281. planes = [plane] if plane in CURRENT_PLANES else CURRENT_PLANES
  282. out = {}
  283. for plane in planes:
  284. writemsr(0x150, 0x8000001600000000 | (CURRENT_PLANES[plane] << 40))
  285. read_value = readmsr(0x150, flatten=True) & 0x3FF
  286. out[plane] = calc_icc_max_amp(read_value) if convert else read_value
  287. return out
  288. def set_icc_max(config):
  289. for plane in CURRENT_PLANES:
  290. try:
  291. write_current_amp = config.getfloat(
  292. 'ICCMAX.{:s}'.format(power['source']), plane, fallback=config.getfloat('ICCMAX', plane, fallback=-1.0)
  293. )
  294. if write_current_amp > 0:
  295. write_value = calc_icc_max_msr(plane, write_current_amp)
  296. writemsr(0x150, write_value)
  297. if args.debug:
  298. write_value &= 0x3FF
  299. read_value = get_icc_max(plane)[plane]
  300. read_current_A = calc_icc_max_amp(read_value)
  301. match = OK if write_value == read_value else ERR
  302. log(
  303. '[D] IccMax plane {:s} - write {:.2f} A ({:#x}) - read {:.2f} A ({:#x}) - match {}'.format(
  304. plane, write_current_amp, write_value, read_current_A, read_value, match
  305. )
  306. )
  307. except (configparser.NoSectionError, configparser.NoOptionError):
  308. pass
  309. def load_config():
  310. config = configparser.ConfigParser()
  311. config.read(args.config)
  312. # config values sanity check
  313. for power_source in ('AC', 'BATTERY'):
  314. for option in ('Update_Rate_s', 'PL1_Tdp_W', 'PL1_Duration_s', 'PL2_Tdp_W', 'PL2_Duration_S'):
  315. value = config.getfloat(power_source, option, fallback=None)
  316. if value is not None:
  317. value = config.set(power_source, option, str(max(0.001, value)))
  318. elif option == 'Update_Rate_s':
  319. fatal('The mandatory "Update_Rate_s" parameter is missing.')
  320. for option in ('Disable_BDPROCHOT'):
  321. value = config.boolean(power_source, option, fallback=None)
  322. if value is None:
  323. value = config.set(power_source, option, 0)
  324. trip_temp = config.getfloat(power_source, 'Trip_Temp_C', fallback=None)
  325. if trip_temp is not None:
  326. valid_trip_temp = min(TRIP_TEMP_RANGE[1], max(TRIP_TEMP_RANGE[0], trip_temp))
  327. if trip_temp != valid_trip_temp:
  328. config.set(power_source, 'Trip_Temp_C', str(valid_trip_temp))
  329. log(
  330. '[!] Overriding invalid "Trip_Temp_C" value in "{:s}": {:.1f} -> {:.1f}'.format(
  331. power_source, trip_temp, valid_trip_temp
  332. )
  333. )
  334. # fix any invalid value (ie. > 0) in the undervolt settings
  335. for key in UNDERVOLT_KEYS:
  336. for plane in VOLTAGE_PLANES:
  337. if key in config:
  338. value = config.getfloat(key, plane)
  339. valid_value = min(0, value)
  340. if value != valid_value:
  341. config.set(key, plane, str(valid_value))
  342. log(
  343. '[!] Overriding invalid "{:s}" value in "{:s}" voltage plane: {:.0f} -> {:.0f}'.format(
  344. key, plane, value, valid_value
  345. )
  346. )
  347. # handle the case where only one of UNDERVOLT.AC, UNDERVOLT.BATTERY keys exists
  348. # by forcing the other key to all zeros (ie. no undervolt)
  349. if any(key in config for key in UNDERVOLT_KEYS[1:]):
  350. for key in UNDERVOLT_KEYS[1:]:
  351. if key not in config:
  352. config.add_section(key)
  353. for plane in VOLTAGE_PLANES:
  354. value = config.getfloat(key, plane, fallback=0.0)
  355. config.set(key, plane, str(value))
  356. # Check for CORE/CACHE values mismatch
  357. for key in UNDERVOLT_KEYS:
  358. if key in config:
  359. if config.getfloat(key, 'CORE', fallback=0) != config.getfloat(key, 'CACHE', fallback=0):
  360. warning('On Skylake and newer CPUs CORE and CACHE values should match!')
  361. break
  362. iccmax_enabled = False
  363. # check for invalid values (ie. <= 0 or > 0x3FF) in the IccMax settings
  364. for key in ICCMAX_KEYS:
  365. for plane in CURRENT_PLANES:
  366. if key in config:
  367. try:
  368. value = config.getfloat(key, plane)
  369. if value <= 0 or value >= 0x3FF:
  370. raise ValueError
  371. iccmax_enabled = True
  372. except ValueError:
  373. warning('Invalid value for {:s} in {:s}'.format(plane, key), oneshot=False)
  374. config.remove_option(key, plane)
  375. except configparser.NoOptionError:
  376. pass
  377. if iccmax_enabled:
  378. warning('Warning! Raising IccMax above design limits can damage your system!')
  379. return config
  380. def calc_reg_values(platform_info, config):
  381. regs = defaultdict(dict)
  382. for power_source in ('AC', 'BATTERY'):
  383. if platform_info['feature_programmable_temperature_target'] != 1:
  384. warning("Setting temperature target is not supported by this CPU")
  385. else:
  386. # the critical temperature for my CPU is 100 'C
  387. critical_temp = get_critical_temp()
  388. # update the allowed temp range to keep at least 3 'C from the CPU critical temperature
  389. global TRIP_TEMP_RANGE
  390. TRIP_TEMP_RANGE[1] = min(TRIP_TEMP_RANGE[1], critical_temp - 3)
  391. Trip_Temp_C = config.getfloat(power_source, 'Trip_Temp_C', fallback=None)
  392. if Trip_Temp_C is not None:
  393. trip_offset = int(round(critical_temp - Trip_Temp_C))
  394. regs[power_source]['MSR_TEMPERATURE_TARGET'] = trip_offset << 24
  395. else:
  396. log('[I] {:s} trip temperature is disabled in config.'.format(power_source))
  397. power_unit = get_power_unit()
  398. PL1_Tdp_W = config.getfloat(power_source, 'PL1_Tdp_W', fallback=None)
  399. PL1_Duration_s = config.getfloat(power_source, 'PL1_Duration_s', fallback=None)
  400. PL2_Tdp_W = config.getfloat(power_source, 'PL2_Tdp_W', fallback=None)
  401. PL2_Duration_s = config.getfloat(power_source, 'PL2_Duration_s', fallback=None)
  402. if (PL1_Tdp_W, PL1_Duration_s, PL2_Tdp_W, PL2_Duration_s).count(None) < 4:
  403. cur_pkg_power_limits = get_cur_pkg_power_limits()
  404. if PL1_Tdp_W is None:
  405. PL1 = cur_pkg_power_limits['PL1']
  406. log('[I] {:s} PL1_Tdp_W disabled in config.'.format(power_source))
  407. else:
  408. PL1 = int(round(PL1_Tdp_W / power_unit))
  409. if PL1_Duration_s is None:
  410. TW1 = cur_pkg_power_limits['TW1']
  411. log('[I] {:s} PL1_Duration_s disabled in config.'.format(power_source))
  412. else:
  413. Y, Z = calc_time_window_vars(PL1_Duration_s)
  414. TW1 = Y | (Z << 5)
  415. if PL2_Tdp_W is None:
  416. PL2 = cur_pkg_power_limits['PL2']
  417. log('[I] {:s} PL2_Tdp_W disabled in config.'.format(power_source))
  418. else:
  419. PL2 = int(round(PL2_Tdp_W / power_unit))
  420. if PL2_Duration_s is None:
  421. TW2 = cur_pkg_power_limits['TW2']
  422. log('[I] {:s} PL2_Duration_s disabled in config.'.format(power_source))
  423. else:
  424. Y, Z = calc_time_window_vars(PL2_Duration_s)
  425. TW2 = Y | (Z << 5)
  426. regs[power_source]['MSR_PKG_POWER_LIMIT'] = (
  427. PL1 | (1 << 15) | (1 << 16) | (TW1 << 17) | (PL2 << 32) | (1 << 47) | (TW2 << 49)
  428. )
  429. else:
  430. log('[I] {:s} package power limits are disabled in config.'.format(power_source))
  431. # cTDP
  432. c_tdp_target_value = config.getint(power_source, 'cTDP', fallback=None)
  433. if c_tdp_target_value is not None:
  434. if platform_info['feature_programmable_tdp_limit'] != 1:
  435. log("[W] cTDP setting not supported by this CPU")
  436. elif platform_info['number_of_additional_tdp_profiles'] < c_tdp_target_value:
  437. log("[W] the configured cTDP profile is not supported by this CPU")
  438. else:
  439. valid_c_tdp_target_value = max(0, c_tdp_target_value)
  440. regs[power_source]['MSR_CONFIG_TDP_CONTROL'] = valid_c_tdp_target_value
  441. return regs
  442. def set_hwp():
  443. # set HWP energy performance preference
  444. cur_val = readmsr(0x774, cpu=0)
  445. new_val = (cur_val & 0xFFFFFFFF00FFFFFF) | (HWP_VALUE << 24)
  446. writemsr(0x774, new_val)
  447. if args.debug:
  448. read_value = readmsr(0x774, from_bit=24, to_bit=31)[0]
  449. match = OK if HWP_VALUE == read_value else ERR
  450. log('[D] HWP - write "{:#02x}" - read "{:#02x}" - match {}'.format(HWP_VALUE, read_value, match))
  451. def power_thread(config, regs, exit_event):
  452. try:
  453. mchbar_mmio = MMIO(0xFED159A0, 8)
  454. except MMIOError:
  455. warning('Unable to open /dev/mem. TDP override might not work correctly.')
  456. warning('Try to disable Secure Boot and/or enable CONFIG_DEVMEM in kernel config.')
  457. mchbar_mmio = None
  458. next_hwp_write = 0
  459. while not exit_event.is_set():
  460. # log thermal status
  461. if args.debug:
  462. thermal_status = get_reset_thermal_status()
  463. for index, core_thermal_status in enumerate(thermal_status):
  464. for key, value in core_thermal_status.items():
  465. log('[D] core {} thermal status: {} = {}'.format(index, key.replace("_", " "), value))
  466. # switch back to sysfs polling
  467. if power['method'] == 'polling':
  468. power['source'] = 'BATTERY' if is_on_battery(config) else 'AC'
  469. # set temperature trip point
  470. if 'MSR_TEMPERATURE_TARGET' in regs[power['source']]:
  471. write_value = regs[power['source']]['MSR_TEMPERATURE_TARGET']
  472. writemsr(0x1A2, write_value)
  473. if args.debug:
  474. read_value = readmsr(0x1A2, 24, 29, flatten=True)
  475. match = OK if write_value >> 24 == read_value else ERR
  476. log(
  477. '[D] TEMPERATURE_TARGET - write {:#x} - read {:#x} - match {}'.format(
  478. write_value >> 24, read_value, match
  479. )
  480. )
  481. # set cTDP
  482. if 'MSR_CONFIG_TDP_CONTROL' in regs[power['source']]:
  483. write_value = regs[power['source']]['MSR_CONFIG_TDP_CONTROL']
  484. writemsr(0x64B, write_value)
  485. if args.debug:
  486. read_value = readmsr(0x64B, 0, 1, flatten=True)
  487. match = OK if write_value == read_value else ERR
  488. log(
  489. '[D] CONFIG_TDP_CONTROL - write {:#x} - read {:#x} - match {}'.format(
  490. write_value, read_value, match
  491. )
  492. )
  493. # set PL1/2 on MSR
  494. write_value = regs[power['source']]['MSR_PKG_POWER_LIMIT']
  495. writemsr(0x610, write_value)
  496. if args.debug:
  497. read_value = readmsr(0x610, 0, 55, flatten=True)
  498. match = OK if write_value == read_value else ERR
  499. log(
  500. '[D] MSR PACKAGE_POWER_LIMIT - write {:#x} - read {:#x} - match {}'.format(
  501. write_value, read_value, match
  502. )
  503. )
  504. if mchbar_mmio is not None:
  505. # set MCHBAR register to the same PL1/2 values
  506. mchbar_mmio.write32(0, write_value & 0xFFFFFFFF)
  507. mchbar_mmio.write32(4, write_value >> 32)
  508. if args.debug:
  509. read_value = mchbar_mmio.read32(0) | (mchbar_mmio.read32(4) << 32)
  510. match = OK if write_value == read_value else ERR
  511. log(
  512. '[D] MCHBAR PACKAGE_POWER_LIMIT - write {:#x} - read {:#x} - match {}'.format(
  513. write_value, read_value, match
  514. )
  515. )
  516. wait_t = config.getfloat(power['source'], 'Update_Rate_s')
  517. enable_hwp_mode = config.getboolean('AC', 'HWP_Mode', fallback=False)
  518. # set HWP less frequently. Just to be safe since (e.g.) TLP might reset this value
  519. if (
  520. enable_hwp_mode
  521. and next_hwp_write <= time()
  522. and (
  523. (power['method'] == 'dbus' and power['source'] == 'AC')
  524. or (power['method'] == 'polling' and not is_on_battery(config))
  525. )
  526. ):
  527. set_hwp()
  528. next_hwp_write = time() + HWP_INTERVAL
  529. else:
  530. exit_event.wait(wait_t)
  531. def check_kernel():
  532. if os.geteuid() != 0:
  533. fatal('No root no party. Try again with sudo.')
  534. kernel_config = None
  535. try:
  536. with open(os.path.join('/boot', 'config-{:s}'.format(uname()[2]))) as f:
  537. kernel_config = f.read()
  538. except IOError:
  539. config_gz_path = os.path.join('/proc', 'config.gz')
  540. try:
  541. if not os.path.isfile(config_gz_path):
  542. subprocess.check_call(('modprobe', 'configs'))
  543. with gzip.open(config_gz_path) as f:
  544. kernel_config = f.read().decode()
  545. except (subprocess.CalledProcessError, IOError):
  546. pass
  547. if kernel_config is None:
  548. log('[W] Unable to obtain and validate kernel config.')
  549. return
  550. elif not re.search('CONFIG_DEVMEM=y', kernel_config):
  551. warning('Bad kernel config: you need CONFIG_DEVMEM=y.')
  552. if not re.search('CONFIG_X86_MSR=(y|m)', kernel_config):
  553. fatal('Bad kernel config: you need CONFIG_X86_MSR builtin or as module.')
  554. def check_cpu():
  555. try:
  556. with open('/proc/cpuinfo') as f:
  557. cpuinfo = {}
  558. for row in f.readlines():
  559. try:
  560. key, value = map(lambda x: x.strip(), row.split(':'))
  561. if key == 'processor' and value == '1':
  562. break
  563. try:
  564. cpuinfo[key] = int(value, 0)
  565. except ValueError:
  566. cpuinfo[key] = value
  567. except ValueError:
  568. pass
  569. if cpuinfo['vendor_id'] != 'GenuineIntel':
  570. fatal('This tool is designed for Intel CPUs only.')
  571. cpu_model = None
  572. for model in supported_cpus:
  573. if cpuinfo['model'] in supported_cpus[model]:
  574. cpu_model = model
  575. break
  576. if cpuinfo['cpu family'] != 6 or cpu_model is None:
  577. fatal('Your CPU model is not supported.')
  578. log('[I] Detected CPU architecture: Intel {:s}'.format(cpu_model))
  579. except:
  580. fatal('Unable to identify CPU model.')
  581. def monitor(exit_event, wait):
  582. IA32_THERM_STATUS = 0x19C
  583. IA32_PERF_STATUS = 0x198
  584. MSR_RAPL_POWER_UNIT = 0x606
  585. MSR_INTEL_PKG_ENERGY_STATUS = 0x611
  586. MSR_PP1_ENERGY_STATUS = 0x641
  587. MSR_DRAM_ENERGY_STATUS = 0x619
  588. wait = max(0.1, wait)
  589. rapl_power_unit = 0.5 ** readmsr(MSR_RAPL_POWER_UNIT, from_bit=8, to_bit=12, cpu=0)
  590. power_plane_msr = {
  591. 'Package': MSR_INTEL_PKG_ENERGY_STATUS,
  592. 'Graphics': MSR_PP1_ENERGY_STATUS,
  593. 'DRAM': MSR_DRAM_ENERGY_STATUS,
  594. }
  595. prev_energy = {
  596. 'Package': (readmsr(MSR_INTEL_PKG_ENERGY_STATUS, cpu=0) * rapl_power_unit, time()),
  597. 'Graphics': (readmsr(MSR_PP1_ENERGY_STATUS, cpu=0) * rapl_power_unit, time()),
  598. 'DRAM': (readmsr(MSR_DRAM_ENERGY_STATUS, cpu=0) * rapl_power_unit, time()),
  599. }
  600. undervolt_values = get_undervolt(convert=True)
  601. undervolt_output = ' | '.join('{:s}: {:.2f} mV'.format(plane, undervolt_values[plane]) for plane in VOLTAGE_PLANES)
  602. log('[D] Undervolt offsets: {:s}'.format(undervolt_output))
  603. iccmax_values = get_icc_max(convert=True)
  604. iccmax_output = ' | '.join('{:s}: {:.2f} A'.format(plane, iccmax_values[plane]) for plane in CURRENT_PLANES)
  605. log('[D] IccMax: {:s}'.format(iccmax_output))
  606. log('[D] Realtime monitoring of throttling causes:\n')
  607. while not exit_event.is_set():
  608. value = readmsr(IA32_THERM_STATUS, from_bit=0, to_bit=15, cpu=0)
  609. offsets = {'Thermal': 0, 'Power': 10, 'Current': 12, 'Cross-domain (e.g. GPU)': 14}
  610. output = ('{:s}: {:s}'.format(cause, LIM if bool((value >> offsets[cause]) & 1) else OK) for cause in offsets)
  611. # ugly code, just testing...
  612. vcore = readmsr(IA32_PERF_STATUS, from_bit=32, to_bit=47, cpu=0) / (2.0 ** 13) * 1000
  613. stats2 = {'VCore': '{:.0f} mV'.format(vcore)}
  614. for power_plane in ('Package', 'Graphics', 'DRAM'):
  615. energy_j = readmsr(power_plane_msr[power_plane], cpu=0) * rapl_power_unit
  616. now = time()
  617. prev_energy[power_plane], energy_w = (
  618. (energy_j, now),
  619. (energy_j - prev_energy[power_plane][0]) / (now - prev_energy[power_plane][1]),
  620. )
  621. stats2[power_plane] = '{:.1f} W'.format(energy_w)
  622. output2 = ('{:s}: {:s}'.format(label, stats2[label]) for label in stats2)
  623. terminator = '\n' if args.log else '\r'
  624. log(
  625. '[{}] {} || {}{}'.format(power['source'], ' - '.join(output), ' - '.join(output2), ' ' * 10),
  626. end=terminator,
  627. )
  628. exit_event.wait(wait)
  629. def main():
  630. global args
  631. parser = argparse.ArgumentParser()
  632. exclusive_group = parser.add_mutually_exclusive_group()
  633. exclusive_group.add_argument('--debug', action='store_true', help='add some debug info and additional checks')
  634. exclusive_group.add_argument(
  635. '--monitor',
  636. metavar='update_rate',
  637. const=1.0,
  638. type=float,
  639. nargs='?',
  640. help='realtime monitoring of throttling causes (default 1s)',
  641. )
  642. parser.add_argument('--config', default='/etc/lenovo_fix.conf', help='override default config file path')
  643. parser.add_argument('--force', action='store_true', help='bypass compatibility checks (EXPERTS only)')
  644. parser.add_argument('--log', metavar='/path/to/file', help='log to file instead of stdout')
  645. args = parser.parse_args()
  646. if args.log:
  647. try:
  648. args.log = open(args.log, 'w')
  649. except:
  650. args.log = None
  651. fatal('Unable to write to the log file!')
  652. if not args.force:
  653. check_kernel()
  654. check_cpu()
  655. log('[I] Loading config file.')
  656. config = load_config()
  657. power['source'] = 'BATTERY' if is_on_battery(config) else 'AC'
  658. platform_info = get_cpu_platform_info()
  659. if args.debug:
  660. for key, value in platform_info.items():
  661. log('[D] cpu platform info: {} = {}'.format(key.replace("_", " "), value))
  662. regs = calc_reg_values(platform_info, config)
  663. if not config.getboolean('GENERAL', 'Enabled'):
  664. return
  665. exit_event = Event()
  666. thread = Thread(target=power_thread, args=(config, regs, exit_event))
  667. thread.daemon = True
  668. thread.start()
  669. undervolt(config)
  670. set_icc_max(config)
  671. # handle dbus events for applying undervolt/IccMax on resume from sleep/hybernate
  672. def handle_sleep_callback(sleeping):
  673. if not sleeping:
  674. undervolt(config)
  675. set_icc_max(config)
  676. def handle_ac_callback(*args):
  677. try:
  678. power['source'] = 'BATTERY' if args[1]['Online'] == 0 else 'AC'
  679. power['method'] = 'dbus'
  680. except:
  681. power['method'] = 'polling'
  682. DBusGMainLoop(set_as_default=True)
  683. bus = dbus.SystemBus()
  684. # add dbus receiver only if undervolt/IccMax is enabled in config
  685. if any(
  686. config.getfloat(key, plane, fallback=0) != 0 for plane in VOLTAGE_PLANES for key in UNDERVOLT_KEYS + ICCMAX_KEYS
  687. ):
  688. bus.add_signal_receiver(
  689. handle_sleep_callback, 'PrepareForSleep', 'org.freedesktop.login1.Manager', 'org.freedesktop.login1'
  690. )
  691. bus.add_signal_receiver(
  692. handle_ac_callback,
  693. signal_name="PropertiesChanged",
  694. dbus_interface="org.freedesktop.DBus.Properties",
  695. path="/org/freedesktop/UPower/devices/line_power_AC",
  696. )
  697. log('[I] Starting main loop.')
  698. if args.monitor is not None:
  699. monitor_thread = Thread(target=monitor, args=(exit_event, args.monitor))
  700. monitor_thread.daemon = True
  701. monitor_thread.start()
  702. try:
  703. loop = GLib.MainLoop()
  704. loop.run()
  705. except (KeyboardInterrupt, SystemExit):
  706. pass
  707. exit_event.set()
  708. loop.quit()
  709. thread.join(timeout=1)
  710. if args.monitor is not None:
  711. monitor_thread.join(timeout=0.1)
  712. if __name__ == '__main__':
  713. main()