<!-- MHonArc v2.6.19 -->
<!--X-Subject: Re: [PATCH v2 &#45;tip] x86/percpu: Use C for arch_raw_cpu_ptr() -->
<!--X-From-R13: Zvahf Fbeinyqf &#60;gbeinyqfNyvahk&#45;sbhaqngvba.bet> -->
<!--X-Date: Thu, 19 Oct 2023 18:39:38 &#45;0400 (EDT) -->
<!--X-Message-Id: CAHk&#45;=wjvHDp+oiC4UZxivF6fCjKWFAAzgBYZdng6qe+ED6rLTg@mail.gmail.com -->
<!--X-Content-Type: text/plain -->
<!--X-Reference: 20231010164234.140750&#45;1&#45;ubizjak@gmail.com -->
<!--X-Reference: CAHk&#45;=whYWhZN52SJN&#45;Th9x2L2V&#45;vHtAXUgiy_nSJ3+vQU6ak4Q@mail.gmail.com -->
<!--X-Reference: CAFULd4ZqH3FeG8_mjDvUAU9QiGB36wDu3MzUtadgAgoVuQ9QRg@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wiALZxieQQmvv5sW15HYB_YwC3d_ma9sdp7Zb4Fb4uK2w@mail.gmail.com -->
<!--X-Reference: F48A9D34&#45;3627&#45;4372&#45;B555&#45;B58CBFC3F241@vmware.com -->
<!--X-Reference: CAHk&#45;=wjF4gzCZKh&#45;zN&#45;sY0WpX1kCo+s9gYE9sOcSv0QieH1dwQ@mail.gmail.com -->
<!--X-Reference: CAFULd4bmOa7G2dXd_mu4J=_bsEs+TbxH691tYx9QQBwJPAma9w@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wj2Co_g3RQ=JkDZC7PYbRqDPq7mePQ0=eYhhtpEgqJD0w@mail.gmail.com -->
<!--X-Reference: 0617BB2F&#45;D08F&#45;410F&#45;A6EE&#45;4135BB03863C@vmware.com -->
<!--X-Reference: CAFULd4Zjd6idrLXuF59cwKxyd1a&#45;&#45;DsiJwGQAKai9Tph30dAow@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wgSsfo89ESHcngvPCkQSh_YAJG&#45;0g7fupb+Uv0E1d_EcQ@mail.gmail.com -->
<!--X-Reference: 7D77A452&#45;E61E&#45;4B8B&#45;B49C&#45;949E1C8E257C@vmware.com -->
<!--X-Reference: CAHk&#45;=wj1dLFkL9Qv2vtk0O8Q6WE&#45;11Jq3KucZoz2Kkw59LAexw@mail.gmail.com -->
<!--X-Reference: 9F926586&#45;20D9&#45;4979&#45;AB7A&#45;71124BBAABD3@vmware.com -->
<!--X-Reference: CAHk&#45;=wi7YKPKKZw5SpA9gZcf4paG4pZ2kUM50g&#45;LQmdF0g6vWg@mail.gmail.com -->
<!--X-Reference: CAFULd4bpHkNzCzKed23mTTBWRyhPnOm91f+F6UE413VK+oFtMQ@mail.gmail.com -->
<!--X-Reference: CAFULd4Z&#45;q4Ot6iyOLo7DkjE=dY3RHXUV+yx6R0iWk=&#45;tZ6ufhQ@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wjSnECwAe+Bi0PD6uods3ZDs8up5OAy&#45;qZKF5OgPLpDiA@mail.gmail.com -->
<!--X-Reference: CAFULd4bLEU&#45;tBC8dO1wf66UAxQ2d1HxQ=D6wvtHZfdQCKhnpkw@mail.gmail.com -->
<!--X-Reference: CAFULd4YAFTFqon3ojv7N6h=G_1pAjSH3T6YvX0G=g7Fwh7j1jQ@mail.gmail.com -->
<!--X-Reference: A2E458DE&#45;8B84&#45;4FB2&#45;BF6D&#45;3EAB2B355078@vmware.com -->
<!--X-Reference: CAFULd4b_PdKb=8U5+Zz&#45;XNoYdULtcQJnmf&#45;yCrpCv7RRogSXyQ@mail.gmail.com -->
<!--X-Reference: CAFULd4Y8_MOMGcatcMuUaC89zX5F&#45;VYr0niiJ9Yd8hQ16neHjw@mail.gmail.com -->
<!--X-Reference: 3F9D776E&#45;AD7E&#45;4814&#45;9E3C&#45;508550AD9287@vmware.com -->
<!--X-Reference: CAFULd4Zruoq4b5imt3NfN4D+0RY2&#45;i==KGAwUHR8JD0T8=HJBw@mail.gmail.com -->
<!--X-Reference: 28B9471C&#45;4FB0&#45;4AB0&#45;81DD&#45;4885C3645E95@vmware.com -->
<!--X-Reference: CAHk&#45;=whS8&#45;Lk_=mFp=mr&#45;JrbRYtScgz&#45;4s_GLAOQGafa_3zP9g@mail.gmail.com -->
<!--X-Reference: CAFULd4Yy&#45;v40tK94rexSOL99FGMke2Jk42wgcjoEBxV=2hXoCw@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wjrLoy6xEDXB=piEUagDLMmV5Up7UK75W1D0E0UFVO&#45;iA@mail.gmail.com -->
<!--X-Reference: CAFULd4autFT=96EckL9vUDgO5t0ESp27+NDVXQHGi7N=PAo&#45;HQ@mail.gmail.com -->
<!--X-Reference: CAFULd4Zhw=zoDtir03FdPxJD15GZ5N=SV9=4Z45_Q_P9BL1rvQ@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wgoWOcToLYbuL2GccbNXwj_MH&#45;LxmB_7MMjw6uu50k57Q@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wgCPbkf0Kdi=4T3LAVvNEH0jxJBWcTiBkrFDBsxkC9mKQ@mail.gmail.com -->
<!--X-Reference: CAFULd4aTY002A7NHRCX21aTpYOE=tnpouBk6hkoeWND=LnT4ww@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wia9vFmyCJPkYg0vvegF8eojLy+DxVtpfoDv&#45;UHoWKfqQ@mail.gmail.com -->
<!--X-Reference: CAFULd4Zj5hTvATZUVYhUGrxH3fiAUWjO9C27UV_USf2H164thQ@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=whEc2HR3En32uyAufPM3tEh8J4+dot6JyGW=Eg5SEhx7A@mail.gmail.com -->
<!--X-Reference: CAFULd4avm_TaEoRauohRc90SUrx&#45;D+wBJvg+htQDQ1_N=zNemw@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wijmmRB7&#45;ZeT&#45;sdxCSUoB83Lb5dnN7a7mCcH3cRw_aghQ@mail.gmail.com -->
<!--X-Reference: CAFULd4b91Tr9Q2p4a20eusC+QO6O81gxY+nP&#45;zpFiFKGTmLpYg@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wi3LZ_4OGAMhvgO0JSTp&#45;eEPOGp+siq1nJNLY1JAxdP5Q@mail.gmail.com -->
<!--X-Reference: CAFULd4YxvMtTEfQL&#45;RiLisTxDwoJZZxXXB+3CWqCpzZkUf85JA@mail.gmail.com -->
<!--X-Reference: CAHk&#45;=wj8qEwR1eGeJdup2q90WK7ZWBjpcXJEBi&#45;TBp29p0n8oQ@mail.gmail.com -->
<!--X-Head-End-->
<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN"
                      "http://www.w3.org/TR/REC-html40/loose.dtd">
<html>
<head>
<meta HTTP-EQUIV="Content-Type" CONTENT="text/html; charset=iso-8859-2">
<title>Linux-Kernel Archive: Re: [PATCH v2 -tip] x86/percpu: Use C for arch_raw_cpu_ptr()</title>
<meta NAME="Author" CONTENT="Linus Torvalds &lt;torvalds@xxxxxxxxxxxxxxxxxxxx&gt;">
<meta NAME="Subject" CONTENT="Re: [PATCH v2 -tip] x86/percpu: Use C for arch_raw_cpu_ptr()">
</head> 
<body BGCOLOR="#FFFFFF" TEXT="#000000">

<!--X-Body-Begin-->
<!--X-User-Header-->
<!--X-User-Header-End-->
<!--X-TopPNI-->


<!--X-TopPNI-End-->
<!--X-MsgBody-->
<!--X-Subject-Header-Begin-->
<h1>Re: [PATCH v2 -tip] x86/percpu: Use C for arch_raw_cpu_ptr()</h1>
<strong>From: </strong>Linus Torvalds
<br><strong>Date: </strong> Thu Oct 19 2023 - 18:39:38 EDT
<p>
<ul>
<li><strong>Next message: </strong> <a href="06587.html"> Jayant Chowdhary: "[PATCH] usb:gadget:uvc: Add super speed plus descriptors"</a>

<li><strong>Previous message: </strong> <a href="06585.html"> Alex Williamson: "Re: [PATCH v17 1/2] vfio/migration: Add debugfs to live migration driver"</a>

<li><strong>In reply to: </strong> <a href="06516.html"> Linus Torvalds: "Re: [PATCH v2 -tip] x86/percpu: Use C for arch_raw_cpu_ptr()"</a>

<li><strong>Next in thread: </strong> <a href="06931.html"> Uros Bizjak: "Re: [PATCH v2 -tip] x86/percpu: Use C for arch_raw_cpu_ptr()"</a>

<li><strong>Messages sorted by: </strong><a href="date.html#06586">[ date ]</a> <a href="index.html#06586">[ thread ]</a> <a href="subject.html#06586">[ subject ]</a> <a href="author.html#06586">[ author ]</a>
</ul>

<!--X-Subject-Header-End-->
<!--X-Head-of-Message-->
<!--X-Head-of-Message-End-->
<!--X-Head-Body-Sep-Begin-->
<hr NOSHADE>
<!--X-Head-Body-Sep-End-->
<!--X-Body-of-Message-->
Unrelated question to the gcc people (well, related in the way that<br>
this discussion made me *test* this).<br>
<br>
Lookie here:<br>
<br>
    int test(void)<br>
    {<br>
        unsigned int sum = 0;<br>
        for (int i = 0; i &lt; 4; i++) {<br>
                unsigned int val;<br>
    #if ONE<br>
                asm(&quot;magic1 %0&quot;:&quot;=r&quot; (val): :&quot;memory&quot;);<br>
    #else<br>
                asm volatile(&quot;magic2 %0&quot;:&quot;=r&quot; (val));<br>
    #endif<br>
                sum += val;<br>
        }<br>
        return sum;<br>
    }<br>
<br>
and now build this with<br>
<br>
    gcc -O2 -S -DONE -funroll-all-loops t.c<br>
<br>
and I get a *completely* nonsensical end result. What gcc generates is<br>
literally insane.<br>
<br>
What I *expected* to happen was that the two cases (with &quot;-DONE&quot; and<br>
without) would generate the same code, since one has an &quot;asm volatile&quot;,<br>
and the other has a memory clobber.<br>
<br>
IOW, neither really should be something that can be combined.<br>
<br>
But no. The &quot;-DONE&quot; version is completely crazy with my gcc-13.2.1 setup.<br>
<br>
First off, it does actually CSE all the asm's despite the memory<br>
clobber. Which I find quite debatable, but whatever.<br>
<br>
But not only does it CSE them, it then does *not* just multiply the<br>
result by four. No. It generates this insanity:<br>
<br>
        magic1 %eax<br>
        movl    %eax, %edx<br>
        addl    %eax, %eax<br>
        addl    %edx, %eax<br>
        addl    %edx, %eax<br>
        ret<br>
<br>
so it has apparently done the CSE _after_ the other optimizations.<br>
<br>
Very strange.<br>
<br>
Honestly, the CSE part looks like an obvious bug to me. The gcc<br>
documentation states:<br>
<br>
     The &quot;memory&quot; clobber tells the compiler that the assembly code<br>
     performs memory reads or writes to items other than those listed in<br>
     the input and output operands (for example, accessing the memory<br>
     pointed to by one of the input parameters).<br>
<br>
so CSE'ing any inline asm with a memory clobber sounds *very* dubious.<br>
The asm literally told the compiler that it has side effects in<br>
unrelated memory locations!<br>
<br>
I don't think we actually care in the kernel (and yes, I think it<br>
would always be safer to use &quot;asm volatile&quot; if there's some unrelated<br>
memory locations that change), but since I was testing this and was<br>
surprised, and since the obvious reading of the documented behavior of<br>
a memory clobber really does scream &quot;you can't combine those asms&quot;, I<br>
thought I'd mention this.<br>
<br>
Also, *without* the memory clobber, gcc obviously still does CSE the<br>
asm, but also, gcc ends up doing just<br>
<br>
        magic1 %eax<br>
        sall    $2, %eax<br>
        ret<br>
<br>
so the memory clobber clearly does actually make a difference. Just<br>
not a _sane_ one.<br>
<br>
In testing, clang does *not* have this apparently buggy behavior (but<br>
clang annoyingly actually checks the instruction mnemonics, so I had<br>
to change &quot;magic&quot; into &quot;strl&quot; instead to make clang happy).<br>
<br>
Hmm?<br>
<br>
                  Linus<br>
<br>
<br>

<!--X-Body-of-Message-End-->
<!--X-MsgBody-End-->
<!--X-Follow-Ups-->
<hr NOSHADE>


<!--X-Follow-Ups-End-->
<!--X-References-->


<!--X-References-End-->
<!--X-BotPNI-->
<ul>
<li><strong>Next message: </strong> <a href="06587.html"> Jayant Chowdhary: "[PATCH] usb:gadget:uvc: Add super speed plus descriptors"</a>

<li><strong>Previous message: </strong> <a href="06585.html"> Alex Williamson: "Re: [PATCH v17 1/2] vfio/migration: Add debugfs to live migration driver"</a>

<li><strong>In reply to: </strong> <a href="06516.html"> Linus Torvalds: "Re: [PATCH v2 -tip] x86/percpu: Use C for arch_raw_cpu_ptr()"</a>

<li><strong>Next in thread: </strong> <a href="06931.html"> Uros Bizjak: "Re: [PATCH v2 -tip] x86/percpu: Use C for arch_raw_cpu_ptr()"</a>

<li><strong>Messages sorted by: </strong><a href="date.html#06586">[ date ]</a> <a href="index.html#06586">[ thread ]</a> <a href="subject.html#06586">[ subject ]</a> <a href="author.html#06586">[ author ]</a>
</ul>

<!--X-BotPNI-End-->
<!--X-User-Footer-->
<!--X-User-Footer-End-->
</body>
</html>