如何優雅地利用C++程式設計從1乘到20？

「已登出」2020-01-11 13:06:34

#include

template

uint64_t

constexpr

uint64_t

fact

；

template

constexpr

uint64_t

fact

；

using

namespace

std

；

int

main

（）

{

cout

fact

endl

；

return

；

}

別的騷操作咱也不會，就先在這裡放個模板的。

CuKing2020-01-11 17:03:09

#include

int

main

（）

{

long

；

long

=！

；

long

；

long

；

long

；

long

；

long

；

long

；

long

；

long

；

long

；

long

；

long

；

long

；

long

；

long

（

）；

long

；

long

=！！

；

long

；

long

=++

；

long

；

printf

（

“%I64d”

，

）；

}

知乎使用者2020-01-12 01:00:57

數學家版本：

#include

int

main

（）

{

std

：：

cout

std

：：

tgamma

（

）

std

：：

endl

；

}

語言學家版本：

#include

template

std

：：

size_t

。。。

constexpr

auto

foo

（

std

：：

index_sequence

。。。

）

{

return

（（

）

。。。）；

}

int

main

（）

{

std

：：

cout

foo

（

std

：：

make_index_sequence

（））

std

：：

endl

；

}

“快速”版本：

#include

long

foo

（

int

，

int

，

std

：：

future

long

last

std

：：

async

（

std

：：

integral_constant

long

，

（）））

{

return

？

last

。

get

（）

：

foo

（（

）

，

std

：：

async

（

foo

，

（

）

，

std

：：

move

（

last

）））；

}

int

main

（）

{

std

：：

cout

foo

（

，

）

std

：：

endl

；

}

歷史學家版本：

#include

void

main

（

void

）

{

int

；

long

；

for

（

，

；

）；

printf

（

“%lld”

，

）；

}

敏捷開發上線1。0版本：

#include

int

main

（）

{

//printf（“%d”， 1*2*3*4*5*6*7*8*9*10）；

printf

（

“%lld”

，

（

long

）

）；

}

面向物件專家版本：

#include

struct

IBaseInterface

{

virtual

IBaseInterface

（）

；

}；

inline

IBaseInterface

：：~

IBaseInterface

（）

default

；

struct

IDataProvider

：

virtual

public

IBaseInterface

{

virtual

int

first

（）

；

virtual

int

last

（）

；

virtual

int

（

int

）

；

}；

struct

ICalculator

：

virtual

public

IBaseInterface

{

virtual

long

calc

（

IDataProvider

）

；

}；

struct

IPrinter

：

virtual

public

IBaseInterface

{

virtual

void

（

const

std

：：

string

）

；

}；

struct

ISerializer

：

virtual

public

IBaseInterface

{

virtual

std

：：

string

serialize

（

long

value

）

；

}；

struct

IRunnable

：

virtual

public

IBaseInterface

{

virtual

void

run

（）

；

}；

class

Foo

：

virtual

public

IRunnable

{

std

：：

shared_ptr

IDataProvider

m_dp

；

std

：：

shared_ptr

ICalculator

m_c

；

std

：：

shared_ptr

ISerializer

m_s

；

std

：：

shared_ptr

IPrinter

m_p

；

public

：

Foo

（

std

：：

shared_ptr

IDataProvider

，

std

：：

shared_ptr

ICalculator

，

std

：：

shared_ptr

ISerializer

，

std

：：

shared_ptr

IPrinter

）

：

m_dp

（

std

：：

move

（

）），

m_c

（

std

：：

move

（

）），

m_s

（

std

：：

move

（

）），

m_p

（

std

：：

move

（

））

{}

void

run

（）

override

{

return

m_p

（

m_s

serialize

（

m_c

calc

（

m_dp

。

get

（））））；

}

}；

class

DefaultSerializer

：

virtual

public

ISerializer

{

public

：

std

：：

string

serialize

（

long

value

）

override

{

return

std

：：

to_string

（

value

）；

}

}；

class

StreamPrinter

：

virtual

public

IPrinter

{

std

：：

ostream

m_os

；

public

：

explicit

StreamPrinter

（

std

：：

ostream

）

：

m_os

（

）

{}

void

（

const

std

：：

string

）

override

{

m_os

std

：：

endl

；

}

}；

class

MultiplyAccumulateCalculator

：

virtual

public

ICalculator

{

public

：

long

calc

（

IDataProvider

）

override

{

int

first

（）；

long

；

（

））；

while

（

！=

last

（））；

return

；

}

}；

int

main

（）

{

struct

MyDataProvider

：

virtual

public

IDataProvider

{

int

first

（）

override

{

return

；

}

int

last

（）

override

{

return

；

}

int

（

int

）

override

{

return

；

}

}；

Foo

foo

（

std

：：

make_shared

MyDataProvider

（），

std

：：

make_shared

MultiplyAccumulateCalculator

（），

std

：：

make_shared

DefaultSerializer

（），

std

：：

make_shared

StreamPrinter

（

std

：：

cout

））；

foo

。

run

（）；

}

提前最佳化的並行版本：

#include

double

foo

（

int

）

{

__m128

{

1。0f

，

2。0f

，

3。0f

，

4。0f

}；

__m128

{

4。0f

，

4。0f

，

4。0f

，

4。0f

}；

__m128

{

1。0f

，

1。0f

，

1。0f

，

1。0f

}；

for

（

int

；

，

_mm_add_ps

（

，

））

_mm_mul_ps

（

，

）；

for

（

int

；

）

［

］

1。0f

；

_mm_mul_ps

（

，

）；

return

（

double

）

［

］

（

double

）

［

］

（

double

）

［

］

（

double

）

［

］；

}

int

main

（）

{

std

：：

cout

foo

（

）

std

：：

endl

；

}

“宏孩兒”超程式設計版：

#include

// 由於boost。preprocessor僅提供255以下的整數運算

// 所以使用sequence來（十位個位）（千位百位）（十萬位萬位）的方式來表示大整數。

// 不進位加法：（77）（66）（55） + （44）（33）（22） = （121）（99）（77）

#define PP_ADD_N_N_CARRY_OP（R， DATA， I， ELEM）（BOOST_PP_ADD（BOOST_PP_SEQ_ELEM（I， DATA）， ELEM））

#define PP_ADD_N_N_CARRY（SEQ_A， SEQ_B） BOOST_PP_SEQ_FOR_EACH_I（PP_ADD_N_N_CARRY_OP， SEQ_A， SEQ_B）

// 進位加法：（121）（99）（77） = （21）（0）（78）

// 注意SEQ_A的長度要比SEQ_B長

#define PP_ADD_N_N_OP（S， STATE， ELEM_CARRY） \

BOOST_PP_SEQ_PUSH_FRONT（ \

BOOST_PP_SEQ_REPLACE（STATE， 0， BOOST_PP_MOD（BOOST_PP_ADD（BOOST_PP_SEQ_HEAD（STATE）， ELEM_CARRY）， 100））， \

BOOST_PP_DIV（BOOST_PP_ADD（BOOST_PP_SEQ_HEAD（STATE）， ELEM_CARRY）， 100） \

）

#define PP_ADD_N_N（SEQ_A， SEQ_B） BOOST_PP_SEQ_REVERSE（BOOST_PP_SEQ_FOLD_LEFT（PP_ADD_N_N_OP， BOOST_PP_SEQ_NIL（0）， PP_ADD_N_N_CARRY（SEQ_A， SEQ_B）））

// 沒什麼好說的，X*N = X+X+X+X+X+。。。+X

#define PP_MUL_N_1_EXP_OP（Z， I， DATA）（DATA）

#define PP_MUL_N_1_EXP（SEQ_N， N） BOOST_PP_REPEAT（N， PP_MUL_N_1_EXP_OP， SEQ_N）

#define PP_MUL_N_1_MYOP（S， STATE， ITEM） PP_ADD_N_N（STATE， ITEM）

#define PP_MUL_N_1_FWD（EXP） BOOST_PP_SEQ_FOLD_LEFT（PP_MUL_N_1_MYOP， BOOST_PP_SEQ_HEAD（EXP）， BOOST_PP_SEQ_TAIL（EXP））

#define PP_MUL_N_1（SEQ_N， N） PP_MUL_N_1_FWD（PP_MUL_N_1_EXP（SEQ_N， N））

#define FACT5 PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（（1）， 2）， 3）， 4）， 5）

#define FACT10 PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（FACT5， 6）， 7）， 8）， 9）， 10）

#define FACT15 PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（FACT10， 11）， 12）， 13）， 14）， 15）

#define FACT20 PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（FACT15， 16）， 17）， 18）， 19）， 20）

#define FACT25 PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（PP_MUL_N_1（FACT20， 21）， 22）， 23）， 24）， 25）

static_assert

（

false

，

BOOST_PP_STRINGIZE

（

FACT10

））；

警告：目前只有Clang能算出FACT20，編譯緩慢是十分正常的，請耐心等待。預設計算10的階乘（10! = 3628800），預期輸出：

error： static_assert failed “（0）（88）（62）（3）（0）（0）（0）（0）（0）（0）”

真·模板超程式設計版本（大整數）

#include

using

BaseType_t

long

；

constexpr

BaseType_t

lgBase

；

// 注意10000*10000剛剛好小於int的取值範圍

constexpr

BaseType_t

Base

1000000000

；

// 注意10000*10000剛剛好小於int的取值範圍

// 大整數的表示

template

BaseType_t

。。。

struct

BigInteger

{

using

type

BigInteger

；

}；

// 連線

template

class

，

class

struct

BI_Cat

；

template

BaseType_t

。。。

，

BaseType_t

。。。

struct

BI_Cat

BigInteger

。。。

，

BigInteger

。。。

：

BigInteger

。。。，

。。。

{}；

// 左移一個單元（即*Base）

template

class

struct

BI_SHL

；

template

BaseType_t

。。。

struct

BI_SHL

BigInteger

。。。

：

BigInteger

。。。，

{}；

// 去除開頭的0

template

class

struct

BI_Remove_Zeros

：

{}；

template

BaseType_t

。。。

struct

BI_Remove_Zeros

BigInteger

，

。。。

：

BI_Remove_Zeros

BigInteger

。。。

{}；

// 填充0到N個單元

template

int

，

class

struct

BI_Fill_Impl

；

template

int

，

class

，

。。。

struct

BI_Fill_Impl

，

std

：：

integer_sequence

，

。。。

：

BigInteger

（

，

）。。。

{}；

template

int

Size

struct

BI_Fill_Zeros

：

BI_Fill_Impl

，

std

：：

make_index_sequence

Size

{}；

template

class

，

int

struct

BI_Resize

；

template

BaseType_t

。。。

，

int

struct

BI_Resize

BigInteger

。。。

，

：

BI_Cat

typename

BI_Fill_Zeros

sizeof

。。。（

）

>：：

type

，

BigInteger

。。。

{}；

// 返回較大的數值

template

int

，

int

struct

int_min

：

std

：：

integral_constant

int

，

（

？

：

）

{}；

// 非進位加法：先把兩個數的位數改成一樣的然後依次相加

template

class

，

class

，

class

ShouldResize

struct

BI_AddNotCarry_Impl

；

template

BaseType_t

。。。

，

BaseType_t

。。。

struct

BI_AddNotCarry_Impl

BigInteger

。。。

，

BigInteger

。。。

，

std

：：

true_type

：

BigInteger

（

）。。。

{}；

template

BaseType_t

。。。

，

BaseType_t

。。。

struct

BI_AddNotCarry_Impl

BigInteger

。。。

，

BigInteger

。。。

，

std

：：

false_type

：

BI_AddNotCarry_Impl

typename

BI_Resize

BigInteger

。。。

，

int_min

sizeof

。。。（

），

sizeof

。。。（

）

>：：

value

>：：

type

，

typename

BI_Resize

BigInteger

。。。

，

int_min

sizeof

。。。（

），

sizeof

。。。（

）

>：：

value

>：：

type

，

std

：：

true_type

{}；

template

class

，

class

struct

BI_AddNotCarry

；

template

BaseType_t

。。。

，

BaseType_t

。。。

struct

BI_AddNotCarry

BigInteger

。。。

，

BigInteger

。。。

：

BI_AddNotCarry_Impl

BigInteger

。。。

，

BigInteger

。。。

，

std

：：

bool_constant

sizeof

。。。（

）

sizeof

。。。（

）

{}；

// 判斷是否為0

template

class

struct

BI_IsZero

；

template

BaseType_t

。。。

struct

BI_IsZero

BigInteger

。。。

：

std

：：

bool_constant

（（

）

。。。）

{}；

// 自動進位

template

class

struct

BI_Carry

；

template

class

，

class

struct

BI_Add

：

BI_Carry

typename

BI_AddNotCarry

，

>：：

type

{}；

template

class

Mod

，

class

Div

，

class

ShouldCalc

typename

BI_IsZero

Div

>：：

type

struct

BI_Carry_Impl

；

template

class

Mod

，

class

Div

struct

BI_Carry_Impl

Mod

，

Div

，

std

：：

true_type

：

Mod

{}；

template

class

Mod

，

class

Div

struct

BI_Carry_Impl

Mod

，

Div

，

std

：：

false_type

：

BI_Add

Mod

，

typename

BI_SHL

Div

>：：

type

{}；

template

BaseType_t

。。。

struct

BI_Carry

BigInteger

。。。

：

BI_Remove_Zeros

typename

BI_Carry_Impl

BigInteger

（

Base

）。。。

，

BigInteger

（

Base

）。。。

>>：：

type

{}；

// 乘以X並自動進位

template

class

，

int

struct

BI_MulX

；

template

BaseType_t

。。。

，

int

struct

BI_MulX

BigInteger

。。。

，

：

BI_Carry

BigInteger

（

）。。。

{}；

// 計算階乘

template

int

struct

BI_Fact

：

BI_MulX

typename

BI_Fact

>：：

type

，

{}；

template

struct

BI_Fact

：

BigInteger

{}；

template

BaseType_t

。。。

std

：：

ostream

operator

（

std

：：

ostream

out

，

BigInteger

。。。

）

{

return

（（

out

std

：：

setfill

（

‘0’

）

std

：：

setw

（

lgBase

）），

。。。）；

}

int

main

（）

{

std

：：

cout

typename

BI_Fact

>：：

type

（）

std

：：

endl

；

}

將BI_Fact<20>改為BI_Fact<1000>後，我們可愛的Clang直譯器花了3秒多的時間很偷稅地算出來了1000! =

40238726007709377354370243392300398571937486421071463254379991042993851239862902059204420848696940480047998861019719605863166687299480855890132382966994459099742450408707375991882362772718873251977950595099527612087497546249704360141827809464649629105639388743788648733711918104582578364784997701247663288983595573543251318532395846307555740911426241747434934755342864657661166779739666882029120737914385371958824980812686783837455973174613608537953452422158659320192809087829730843139284440328123155861103697680135730421616874760967587134831202547858932076716913244842623613141250878020800026168315102734182797770478463586817016436502415369139828126481021309276124489635992870511496497541990934222156683257208082133318611681155361583654698404670897560290095053761647584772842188967964624494516076535340819890138544248798495995331910172335555660213945039973628075013783761530712776192684903435262520001588853514733161170210396817592151090778801939317811419454525722386554146106289218796022383897147608850627686296714667469756291123408243920816015378088989396451826324367161676217916890977991190375403127462228998800519544441428201218736174599264295658174662830295557029902432415318161721046583203678690611726015878352075151628422554026517048330422614397428693306169089796848259012545832716822645806652676995865268227280707578139185817888965220816434834482599326604336766017699961283186078838615027946595513115655203609398818061213855860030143569452722420634463179746059468257310379008402443243846565724501440282188525247093519062092902313649327349756551395872055965422874977401141334696271542284586237738753823048386568897646192738381490014076731044664025989949022222176590433990188601856652648506179970235619389701786004081188972991831102117122984590164192106888438712185564612496079872290851929681937238864261483965738229112312502418664935314397013742853192664987533721894069428143411852015801412334482801505139969429015348307764456909907315243327828826986460278986432113908350621709500259738986355
4277196742822248757586765752344220207573630569498825087968928162753848863396909959826280956121450994871701244516461260379029309120889086942028510640182154399457156805941872748998094254742173582401063677404595741785160829230135358081840096996372524230560855903700624271243416909004153690105933983835777939410970027753472000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000

無人值守自動迭代版本

#include

int

main

（）

{

std

：：

vector

int

（

std

：：

atoi

（

std

：：

end

（

__DATE__

）

（

__LINE__

）

））；

// 2020年，第六行

std

：：

iota

（

。

begin

（），

。

end

（），

）；

std

：：

cout

std

：：

accumulate

（

。

begin

（），

。

end

（），

1ull

，

std

：：

multiplies

（））

std

：：

endl

；

}

模板超程式設計版本（二進位制）

#include

using

Zero

std

：：

integer_sequence

bool

；

using

One

std

：：

integer_sequence

bool

，

true

；

template

class

struct

type_identity

：

std

：：

enable_if

true

，

{}；

// *2

template

class

struct

shl

；

template

bool

。。。

struct

shl

std

：：

integer_sequence

bool

，

。。。

：

type_identity

std

：：

integer_sequence

bool

，

false

，

。。。

{}；

// *2+1

template

class

struct

shl_inc

；

template

bool

。。。

struct

shl_inc

std

：：

integer_sequence

bool

，

。。。

：

type_identity

std

：：

integer_sequence

bool

，

true

，

。。。

{}；

// /2

template

class

struct

shr

；

template

bool

First

，

bool

。。。

Rest

struct

shr

std

：：

integer_sequence

bool

，

First

，

Rest

。。。

：

type_identity

std

：：

integer_sequence

bool

，

Rest

。。。

{}；

// +1

template

class

struct

inc

；

template

struct

inc

Zero

：

type_identity

One

{}；

template

bool

。。。

struct

inc

std

：：

integer_sequence

bool

，

true

，

。。。

：

shl

typename

inc

std

：：

integer_sequence

bool

，

。。。

>>：：

type

{}；

template

bool

。。。

struct

inc

std

：：

integer_sequence

bool

，

false

，

。。。

：

type_identity

std

：：

integer_sequence

bool

，

true

，

。。。

{}；

// -1

template

class

struct

dec

；

template

bool

。。。

struct

dec

std

：：

integer_sequence

bool

，

true

，

。。。

：

type_identity

std

：：

integer_sequence

bool

，

false

，

。。。

{}；

template

bool

。。。

struct

dec

std

：：

integer_sequence

bool

，

false

，

。。。

：

shl_inc

typename

dec

std

：：

integer_sequence

bool

，

。。。

>>：：

type

{}；

// 取最低位

template

class

struct

lowest

：

std

：：

false_type

{}；

template

bool

First

，

bool

。。。

Rest

struct

lowest

std

：：

integer_sequence

bool

，

First

，

Rest

。。。

：

std

：：

bool_constant

First

{}；

// 擴充套件位數

template

class

struct

ext

；

template

bool

。。。

struct

ext

std

：：

integer_sequence

bool

，

。。。

：

type_identity

std

：：

integer_sequence

bool

，

。。。，

false

{}；

// 比較兩個數是否相等

template

class

，

class

struct

test

；

template

bool

。。。

，

bool

。。。

struct

test

std

：：

integer_sequence

bool

，

。。。

，

std

：：

integer_sequence

bool

，

。。。

：

std

：：

bool_constant

（。。。

（

））

{}；

// 計算位數大小

template

class

struct

len

；

template

struct

len

Zero

：

std

：：

integral_constant

std

：：

size_t

，

{}；

template

bool

。。。

struct

len

std

：：

integer_sequence

bool

，

。。。

：

std

：：

integral_constant

std

：：

size_t

，

sizeof

。。。（

）

{}；

// 去除多餘的高位

template

class

，

bool

not_empty

test

，

>：：

value

struct

shrink

：

type_identity

Zero

{}；

template

bool

。。。

struct

shrink

std

：：

integer_sequence

bool

，

false

，

。。。

，

true

：

shl

typename

shrink

std

：：

integer_sequence

bool

，

。。。

>>：：

type

{}；

template

bool

。。。

struct

shrink

std

：：

integer_sequence

bool

，

true

，

。。。

，

true

：

shl_inc

typename

shrink

std

：：

integer_sequence

bool

，

。。。

>>：：

type

{}；

// 實現超前進位加法器

template

class

，

class

，

bool

loop

test

，

>：：

value

struct

add_impl

：

type_identity

{}；

template

bool

。。。

，

bool

。。。

struct

add_impl

std

：：

integer_sequence

bool

，

。。。

，

std

：：

integer_sequence

bool

，

。。。

，

true

：

add_impl

std

：：

integer_sequence

bool

，

（

）。。。，

false

，

std

：：

integer_sequence

bool

，

false

，

（

）。。。

{}；

// 加法時處理位數不同的情況

template

class

，

class

，

bool

（

len

>：：

value

len

>：：

value

）

struct

add_fill2

：

add_impl

，

{}；

template

class

，

class

struct

add_fill2

，

true

：

add_fill2

，

typename

ext

>：：

type

{}；

template

class

，

class

，

bool

（

len

>：：

value

len

>：：

value

）

struct

add

：

add_fill2

，

{}；

template

class

，

class

struct

add

，

true

：

add

typename

ext

>：：

type

，

{}；

// 實現乘法器

template

class

，

class

，

bool

add

lowest

>：：

value

struct

mul

；

template

class

struct

mul

，

Zero

，

false

：

type_identity

Zero

{}；

template

class

，

class

struct

mul

，

false

：

mul

typename

shl

>：：

type

，

typename

shr

>：：

type

{}；

template

class

，

class

struct

mul

，

true

：

add

typename

mul

typename

shl

>：：

type

，

typename

shr

>：：

type

>：：

type

，

{}；

// 計算階乘

template

class

struct

greater_than_one

：

test

typename

dec

>：：

type

，

typename

dec

>：：

type

{}；

template

class

struct

fact

：

shrink

typename

mul

，

typename

fact

typename

shrink

typename

dec

>：：

type

>：：

type

>：：

type

>：：

type

{}；

template

struct

fact

One

：

type_identity

One

{}；

// 轉換為bitset輸出

template

bool

。。。

，

std

：：

size_t

。。。

auto

ToBitSet

（

std

：：

integer_sequence

bool

，

。。。

，

std

：：

integer_sequence

std

：：

size_t

，

。。。

）

{

std

：：

bitset

sizeof

。。。（

）

ret

；

（。。。，

ret

。

set

（

，

））；

return

ret

；

}

template

bool

。。。

auto

ToBitSet

（

std

：：

integer_sequence

bool

，

。。。

）

{

return

ToBitSet

（

，

std

：：

make_index_sequence

sizeof

。。。（

）

（））；

}

int

main

（）

{

using

F20

fact

std

：：

integer_sequence

bool

，

false

，

false

，

true

，

false

，

true

>>：：

type

；

std

：：

cout

ToBitSet

（

F20

（））。

to_ullong

（）

std

：：

endl

；

//using F31 = fact>：：type；

//std：：cout << ToBitSet（F31（））。to_string（） << std：：endl；

}

注：目前極限是計算到31的階乘，使用MSVC編譯31的階乘需30G記憶體。

更新：

2020-1-12 將“歷史學家”版本修改為void main（void）更具有歷史氣息

2020-1-16 將“快速”二分版本修改為「偽」遞迴呼叫

2020-1-18 並行版本

2020-2-22 宏超程式設計版本

2020-2-24 模板超程式設計版本（大整數）

2020-3-14 無人值守自動迭代版本

2021-10-12 模板超程式設計版本（二進位制）

Aqua2020-02-15 08:41:04

一、可以寫成一個Y組合子：

// NOTE： Only compatible with C++14 or later versions。

#include

int

main

（

int

argc

，

char

argv

［］）

{

// y = λf。（λx。 x x）（λx。 f （λn。（x x） n））

const

auto

［］

（

const

auto

）

{

return

［

］

（

const

auto

）

{

return

（

）；

}

（［

］

（

const

auto

）

std

：：

function

unsigned

long

（

unsigned

long

）

{

return

（［

］

（

unsigned

long

）

{

return

（

）（

）；

}）；

}；

// almost_fac = λf。 λn。 if n > 0 then n × f （n - 1） else 1

const

auto

almost_fac

［］

（

auto

）

{

return

［

］

（

unsigned

long

）

{

return

？

（

）

：

；

}；

std

：：

cout

（

almost_fac

）（

）

std

：：

endl

；

return

；

}

二、可以跟風樓上守序善良一下：

// NOTE： Only tested on x86-64 Linux / macOS。

int

main

（

int

argc

，

char

argv

［］）

{

asm

volatile

（

“（

movq

，

rax

movq

，

rcx

fac

：

mulq

rcx

incq

rcx

cmpq

，

rcx

jle

fac

movq

，

rcx

movq

rsp

，

rbx

movb

，

（

rsp

）

subq

，

rsp

digit

：

xorq

rdx

，

rdx

divq

rcx

addq

，

rdx

movb

，

（

rsp

）

subq

，

rsp

testq

rax

，

rax

jnz

digit

movq

，

rdi

movq

rsp

，

rsi

：

addq

，

rsi

movq

，

rdx

）

”

#ifdef __APPLE__

“movq $0x2000004， %rax”

#else

“movq $1， %rax”

#endif

“（

syscall

movq

rsi

，

rsp

cmpq

rsi

，

rbx

）

”

#ifdef __APPLE__

“movq $0x2000001， %rax”

#else

“movq $60， %rax”

#endif

“（

xorq

rdi

，

rdi

syscall

）

”）；

}

三、上面的程式碼還可以更善良一些：

// NOTE： Only tested on x86-64 Linux / macOS。

constexpr

char

［］

“

\x48\x31\xc0\x48\x31\xc9\x48\xff\xc0\x48\xff\xc1\x48\xf7\xe1\x48\xff\xc1

”

“

\x48\x83\xf9\x14\x0f\x8e\xf0\xff\xff\xff\x48\x31\xc9\x48\x83\xc1\x0a\x48

”

“

\x89\xe3\xc6\x04\x24\x0a\x48\x83\xec\x08\x48\x31\xd2\x48\xf7\xf1\x48\x83

”

“

\xc2\x30\x88\x14\x24\x48\x83\xec\x08\x48\x85\xc0\x0f\x85\xe6\xff\xff\xff

”

“

\x48\x31\xff\x48\xff\xc7\x48\x89\xe6\x48\x83\xc6\x08\x48\x31\xd2\x48\xff

”

“

\xc2

”

#ifdef __APPLE__

“

\x48\xc7\xc0\xff\xff\xff\x01\x48\x83\xc0\x05\x0f\x05\x48\x89\xf4\x48\x39

”

“

\xf3\x90\x0f\x8f\xdc\xff\xff\xff\x48\xc7\xc0\xff\xff\xff\x01\x48\x83\xc0

”

“

\x02

”

#else

“

\x48\x31\xc0\x48\xff\xc0\x0f\x05\x48\x89\xf4\x48\x39\xf3\x0f\x8f\xe2\xff

”

“

\xff\xff\x48\x31\xc0\x48\x83\xc0\x3b\x48\xff\xc0

”

#endif

“

\x48\x31\xff\x0f\x05

”

；

int

main

（

int

argc

，

char

argv

［］）

{

void

nullptr

；

#ifdef __clang__

（

）

（

void

）

；

#else

（

）

（

void

）

；

#endif

return

；

}

四、補一個模板，可惜不是很想寫遞迴：

// NOTE： Only compatible with C++17 or later versions。

#include

namespace

{

template

typename

struct

FactorialHelper

；

template

unsigned

long

。。。

struct

FactorialHelper

std

：：

integer_sequence

unsigned

long

，

。。。

：

public

std

：：

integral_constant

unsigned

long

，

（（

）

。。。）

{}；

template

unsigned

long

using

Factorial

FactorialHelper

std

：：

make_integer_sequence

unsigned

long

，

；

}

// namespace

int

main

（

int

argc

，

char

argv

［］）

{

std

：：

cout

Factorial

>：：

value

std

：：

endl

；

return

；

}

五、模板也可以這麼寫：

// NOTE： Only compatible with C++17 or later versions。

#include

namespace

{

constexpr

size_t

kMaxN

；

template

size_t

struct

Flag

{

friend

constexpr

int

AdlFlag

（

Flag

）；

}；

template

typename

struct

Writer

{

friend

constexpr

int

AdlFlag

（

）

{

return

；

}

}；

template

typename

，

int

AdlFlag

（

{}）

constexpr

size_t

IsAdlFlagDefined

（

int

）

{

return

；

}

template

typename

constexpr

size_t

IsAdlFlagDefined

（。。。）

{

return

；

}

template

size_t

，

size_t

。。。

Sizes

，

size_t

（（

IsAdlFlagDefined

Flag

Sizes

（

））

。。。）

constexpr

size_t

CountDefinedAdlFlags

（

std

：：

integer_sequence

size_t

，

Sizes

。。。

）

{

return

；

}

template

size_t

MaxN

kMaxN

，

size_t

，

typename

std

：：

make_integer_sequence

size_t

，

MaxN

，

size_t

CounterMinus1

CountDefinedAdlFlags

（

{}），

size_t

sizeof

（

Writer

Flag

CounterMinus1

）

using

Counter

std

：：

integral_constant

unsigned

long

，

CounterMinus1

；

}

// namespace

int

main

（

int

argc

，

char

argv

［］）

{

// NOTE： Each ‘Counter<>：：value’ is evaluated separately during the compile

// time thus the following lines cannot be shortened by loops or recursions。

std

：：

cout

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

Counter

<>：：

value

std

：：

endl

；

return

；

}

六、最後，別光折騰CPU，GPU也別讓它閒著：

// NOTE： Only tested on x86-64 macOS。

#include

#ifdef __APPLE__

#include

#else

#include

#endif

#include

namespace

{

constexpr

unsigned

long

；

constexpr

cl_uint

kMaxNumPlatforms

；

constexpr

cl_uint

kMaxNumDevices

；

constexpr

char

kKernelSource

［］

“（

__kernel

void

factorial

（

__global

long

unsigned

int

buffer

，

const

long

unsigned

int

）

{

const

long

unsigned

int

get_global_id

（

）；

buffer

［

］

（

）

；

for

（

long

unsigned

int

stride

；

stride

；

stride

<<=

）

{

buffer

［

］

buffer

［

stride

］；

}

）

”；

void

check

（

const

bool

condition

，

const

char

err_msg

）

{

（

！

condition

）

{

std

：：

cerr

err_msg

std

：：

endl

；

exit

（

EXIT_FAILURE

）；

}

void

check

（

const

cl_int

err

，

const

char

err_msg

）

{

（

err

！=

CL_SUCCESS

）

{

std

：：

ostringstream

merged_err_msg

；

merged_err_msg

err_msg

“ With error： ”

err

；

check

（

/* condition = */

false

，

merged_err_msg

。

str

（）。

c_str

（））；

}

// namespace

int

main

（

int

argc

，

char

argv

［］）

{

cl_platform_id

platforms

［

kMaxNumPlatforms

］；

cl_uint

num_platforms

；

cl_int

err

clGetPlatformIDs

（

kMaxNumPlatforms

，

platforms

，

num_platforms

）；

check

（

err

CL_SUCCESS

num_platforms

，

“Failed to find platforms。”

）；

cl_device_id

device_ids

［

kMaxNumDevices

］；

cl_uint

num_devices

；

err

clGetDeviceIDs

（

platforms

［

］，

CL_DEVICE_TYPE_GPU

，

kMaxNumDevices

，

device_ids

，

num_devices

）；

check

（

err

，

“Failed to find devices。”

）；

const

size_t

which_device

num_devices

；

const

cl_device_id

device_id

device_ids

［

which_device

］；

const

cl_context

context

clCreateContext

（

/* properties = */

nullptr

，

/* num_devices = */

，

device_id

，

/* devices = */

nullptr

，

/* pfn_notify = */

nullptr

，

err

）；

check

（

err

，

“Failed to create context。”

）；

const

cl_command_queue

commands

clCreateCommandQueue

（

context

，

device_ids

［

which_device

］，

/* cl_command_queue_properties = */

，

err

）；

check

（

err

，

“Failed to create command queue。”

）；

const

char

src

kKernelSource

；

const

cl_program

program

clCreateProgramWithSource

（

context

，

/* count= */

，

static_cast

const

char

**>

（

src

），

/* lengths = */

，

err

）；

check

（

err

，

“Failed to create program。”

）；

err

clBuildProgram

（

program

，

/* num_devices = */

，

/* device_list = */

nullptr

，

/* options = */

nullptr

，

/* pfn_notify = */

nullptr

，

/* user_data = */

nullptr

）；

check

（

err

，

“Failed to build program。”

）；

const

cl_kernel

kernel

clCreateKernel

（

program

，

“factorial”

，

err

）；

check

（

err

，

“Failed to create kernel。”

）；

const

size_t

log2n

static_cast

size_t

（

std

：：

ceil

（

std

：：

log2

（

）））；

const

size_t

num_threads

log2n

；

const

size_t

buffer_size

num_threads

sizeof

（

unsigned

long

）；

const

cl_mem

buffer

clCreateBuffer

（

context

，

CL_MEM_READ_WRITE

，

buffer_size

，

/* host_ptr = */

nullptr

，

err

）；

check

（

err

，

“Failed to create buffer。”

）；

err

clSetKernelArg

（

kernel

，

/* arg_index = */

，

sizeof

（

buffer

），

buffer

）；

check

（

err

，

“Failed to set kernel arg ‘buffer’。”

）；

err

clSetKernelArg

（

kernel

，

/* arg_index = */

，

sizeof

（

），

）；

check

（

err

，

“Failed to set kernel arg ‘n’。”

）；

size_t

local

；

err

clGetKernelWorkGroupInfo

（

kernel

，

device_id

，

CL_KERNEL_WORK_GROUP_SIZE

，

sizeof

（

local

），

local

，

/* param_value_size_ret = */

nullptr

）；

check

（

err

，

“Failed to get kernel work group info。”

）；

const

size_t

global

local

static_cast

size_t

（

std

：：

ceil

（

num_threads

1。0

local

））；

err

clEnqueueNDRangeKernel

（

commands

，

kernel

，

/* work_dim = */

，

/* global_work_offset = */

nullptr

，

global

，

local

，

/* num_events_in_wait_list = */

，

/* event_wait_list = */

nullptr

，

/* event = */

nullptr

）；

check

（

err

，

“Failed to execute kernel。”

）；

check

（

clFinish

（

commands

），

“Failed to finish commands。”

）；

unsigned

long

result

；

err

clEnqueueReadBuffer

（

commands

，

buffer

，

CL_TRUE

，

/* offset = */

，

sizeof

（

unsigned

long

），

result

，

/* num_events_in_wait_list = */

，

/* event_wait_list = */

nullptr

，

/* event = */

nullptr

）；

check

（

err

，

“Failed to read buffer。”

）；

std

：：

cout

result

std

：：

endl

；

check

（

clReleaseMemObject

（

buffer

），

“Failed to release buffer。”

）；

check

（

clReleaseProgram

（

program

），

“Failed to release program。”

）；

check

（

clReleaseKernel

（

kernel

），

“Failed to release kernel。”

）；

check

（

clReleaseCommandQueue

（

commands

），

“Failed to release command queue。”

）；

check

（

clReleaseContext

（

context

），

“Failed to release context。”

）；

return

；

}

寫這段程式碼的時候還以為不能用CUDA，因為它是C++的超集。感謝 @D Flip Flop 大神指出可以用CUDA Thrust，他的寫法比我手寫OpenCL簡潔太多了：