realname "Montgomery Reduction (x86-64)"

mp_bits 64

load_on never

<add>
mp_monty.S
</add>

<arch>
amd64
</arch>

<cc>
gcc
icc
</cc>

# ELF systems
<os>
linux
freebsd
netbsd
openbsd
solaris
</os>

<requires>
asm_ia32
</requires>