2022-04-07 18:46:57 +02:00

317 lines
10 KiB
C++

/*
Copyright (c) 2005-2020 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#include "../../common/utility/utility.h"
#include "../../common/utility/get_default_num_threads.h"
#if __TBB_MIC_OFFLOAD
#pragma offload_attribute (push,target(mic))
#endif // __TBB_MIC_OFFLOAD
#include <cstdio>
#include <cstdlib>
#include <string>
#include <atomic>
#include "tbb/tick_count.h"
#include "tbb/task_group.h"
#include "tbb/global_control.h"
#pragma warning(disable: 4996)
const unsigned BOARD_SIZE=81;
const unsigned BOARD_DIM=9;
using namespace tbb;
using namespace std;
std::atomic<unsigned> nSols;
bool find_one = false;
bool verbose = false;
unsigned short init_values[BOARD_SIZE] = {1,0,0,9,0,0,0,8,0,0,8,0,2,0,0,0,0,0,0,0,5,0,0,0,7,0,0,0,5,2,1,0,0,4,0,0,0,0,0,0,0,5,0,0,7,4,0,0,7,0,0,0,3,0,0,3,0,0,0,2,0,0,5,0,0,0,0,0,0,1,0,0,5,0,0,0,1,0,0,0,0};
task_group *g;
double solve_time;
typedef struct {
unsigned short solved_element;
unsigned potential_set;
} board_element;
void read_board(const char *filename) {
FILE *fp;
int input;
fp = fopen(filename, "r");
if (!fp) {
fprintf(stderr, "sudoku: Could not open input file '%s'.\n", filename);
exit(1);
}
for (unsigned i=0; i<BOARD_SIZE; ++i) {
if (fscanf(fp, "%d", &input))
init_values[i] = input;
else {
fprintf(stderr, "sudoku: Error in input file at entry %d, assuming 0.\n", i);
init_values[i] = 0;
}
}
fclose(fp);
}
void print_board(board_element *b) {
for (unsigned row=0; row<BOARD_DIM; ++row) {
for (unsigned col=0; col<BOARD_DIM; ++col) {
printf(" %d", b[row*BOARD_DIM+col].solved_element);
if (col==2 || col==5) printf(" |");
}
printf("\n");
if (row==2 || row==5) printf(" ---------------------\n");
}
}
void print_potential_board(board_element *b) {
for (unsigned row=0; row<BOARD_DIM; ++row) {
for (unsigned col=0; col<BOARD_DIM; ++col) {
if (b[row*BOARD_DIM+col].solved_element)
printf(" %4d ", b[row*BOARD_DIM+col].solved_element);
else
printf(" [%4d]", b[row*BOARD_DIM+col].potential_set);
if (col==2 || col==5) printf(" |");
}
printf("\n");
if (row==2 || row==5)
printf(" ------------------------------------------------------------------\n");
}
}
void init_board(board_element *b) {
for (unsigned i=0; i<BOARD_SIZE; ++i)
b[i].solved_element = b[i].potential_set = 0;
}
void init_board(board_element *b, unsigned short arr[81]) {
for (unsigned i=0; i<BOARD_SIZE; ++i) {
b[i].solved_element = arr[i];
b[i].potential_set = 0;
}
}
void init_potentials(board_element *b) {
for (unsigned i=0; i<BOARD_SIZE; ++i)
b[i].potential_set = 0;
}
void copy_board(board_element *src, board_element *dst) {
for (unsigned i=0; i<BOARD_SIZE; ++i)
dst[i].solved_element = src[i].solved_element;
}
bool fixed_board(board_element *b) {
for (int i=BOARD_SIZE-1; i>=0; --i)
if (b[i].solved_element==0) return false;
return true;
}
bool in_row(board_element *b, unsigned row, unsigned col, unsigned short p) {
for (unsigned c=0; c<BOARD_DIM; ++c)
if (c!=col && b[row*BOARD_DIM+c].solved_element==p) return true;
return false;
}
bool in_col(board_element *b, unsigned row, unsigned col, unsigned short p) {
for (unsigned r=0; r<BOARD_DIM; ++r)
if (r!=row && b[r*BOARD_DIM+col].solved_element==p) return true;
return false;
}
bool in_block(board_element *b, unsigned row, unsigned col, unsigned short p) {
unsigned b_row = row/3 * 3, b_col = col/3 * 3;
for (unsigned i=b_row; i<b_row+3; ++i)
for (unsigned j=b_col; j<b_col+3; ++j)
if (!(i==row && j==col) && b[i*BOARD_DIM+j].solved_element==p) return true;
return false;
}
void calculate_potentials(board_element *b) {
for (unsigned i=0; i<BOARD_SIZE; ++i) {
b[i].potential_set = 0;
if (!b[i].solved_element) { // element is not yet fixed
unsigned row = i/BOARD_DIM, col = i%BOARD_DIM;
for (unsigned potential=1; potential<=BOARD_DIM; ++potential) {
if (!in_row(b, row, col, potential) && !in_col(b, row, col, potential)
&& !in_block(b, row, col, potential))
b[i].potential_set |= 1<<(potential-1);
}
}
}
}
bool valid_board(board_element *b) {
bool success=true;
for (unsigned i=0; i<BOARD_SIZE; ++i) {
if (success && b[i].solved_element) { // element is fixed
unsigned row = i/BOARD_DIM, col = i%BOARD_DIM;
if (in_row(b, row, col, b[i].solved_element) || in_col(b, row, col, b[i].solved_element) || in_block(b, row, col, b[i].solved_element))
success = false;
}
}
return success;
}
bool examine_potentials(board_element *b, bool *progress) {
bool singletons = false;
for (unsigned i=0; i<BOARD_SIZE; ++i) {
if (b[i].solved_element==0 && b[i].potential_set==0) // empty set
return false;
switch (b[i].potential_set) {
case 1: { b[i].solved_element = 1; singletons=true; break; }
case 2: { b[i].solved_element = 2; singletons=true; break; }
case 4: { b[i].solved_element = 3; singletons=true; break; }
case 8: { b[i].solved_element = 4; singletons=true; break; }
case 16: { b[i].solved_element = 5; singletons=true; break; }
case 32: { b[i].solved_element = 6; singletons=true; break; }
case 64: { b[i].solved_element = 7; singletons=true; break; }
case 128: { b[i].solved_element = 8; singletons=true; break; }
case 256: { b[i].solved_element = 9; singletons=true; break; }
}
}
*progress = singletons;
return valid_board(b);
}
#if !__TBB_CPP11_LAMBDAS_PRESENT
void partial_solve(board_element *b, unsigned first_potential_set);
class PartialSolveBoard {
board_element *b;
unsigned first_potential_set;
public:
PartialSolveBoard(board_element *_b, unsigned fps) :
b(_b), first_potential_set(fps) {}
void operator() () const {
partial_solve(b, first_potential_set);
}
};
#endif
void partial_solve(board_element *b, unsigned first_potential_set) {
if (fixed_board(b)) {
if ( find_one )
g->cancel();
if (++nSols==1 && verbose) {
print_board(b);
}
free(b);
return;
}
calculate_potentials(b);
bool progress=true;
bool success = examine_potentials(b, &progress);
if (success && progress) {
partial_solve(b, first_potential_set);
} else if (success && !progress) {
board_element *new_board;
while (b[first_potential_set].solved_element!=0) ++first_potential_set;
for (unsigned short potential=1; potential<=BOARD_DIM; ++potential) {
if (1<<(potential-1) & b[first_potential_set].potential_set) {
new_board = (board_element *)malloc(BOARD_SIZE*sizeof(board_element));
copy_board(b, new_board);
new_board[first_potential_set].solved_element = potential;
#if __TBB_CPP11_LAMBDAS_PRESENT
g->run( [=]{ partial_solve(new_board, first_potential_set); } );
#else
g->run(PartialSolveBoard(new_board, first_potential_set));
#endif
}
}
free(b);
}
else {
free(b);
}
}
unsigned solve(int p) {
tbb::global_control c(tbb::global_control::max_allowed_parallelism, p);
nSols = 0;
board_element *start_board = (board_element *)malloc(BOARD_SIZE*sizeof(board_element));
init_board(start_board, init_values);
g = new task_group;
tick_count t0 = tick_count::now();
partial_solve(start_board, 0);
g->wait();
solve_time = (tick_count::now() - t0).seconds();
delete g;
return nSols;
}
#if __TBB_MIC_OFFLOAD
#pragma offload_attribute (pop)
#endif // __TBB_MIC_OFFLOAD
int main(int argc, char *argv[]) {
try {
tbb::tick_count mainStartTime = tbb::tick_count::now();
utility::thread_number_range threads(utility::get_default_num_threads);
string filename = "";
bool silent = false;
utility::parse_cli_arguments(argc,argv,
utility::cli_argument_pack()
//"-h" option for displaying help is present implicitly
.positional_arg(threads,"n-of-threads",utility::thread_number_range_desc)
.positional_arg(filename,"filename","input filename")
.arg(verbose,"verbose","prints the first solution")
.arg(silent,"silent","no output except elapsed time")
.arg(find_one,"find-one","stops after finding first solution\n")
);
if ( silent ) verbose = false;
if ( !filename.empty() )
read_board( filename.c_str() );
// otherwise (if file name not specified), the default statically initialized board will be used.
for(int p = threads.first; p <= threads.last; p = threads.step(p) ) {
unsigned number;
#if __TBB_MIC_OFFLOAD
#pragma offload target(mic) in(init_values, p, verbose, find_one) out(number, solve_time)
{
#endif // __TBB_MIC_OFFLOAD
number = solve(p);
#if __TBB_MIC_OFFLOAD
}
#endif // __TBB_MIC_OFFLOAD
if ( !silent ) {
if ( find_one ) {
printf("Sudoku: Time to find first solution on %d threads: %6.6f seconds.\n", p, solve_time);
}
else {
printf("Sudoku: Time to find all %u solutions on %d threads: %6.6f seconds.\n", number, p, solve_time);
}
}
}
utility::report_elapsed_time((tbb::tick_count::now() - mainStartTime).seconds());
return 0;
} catch(std::exception& e) {
std::cerr<<"error occurred. error text is :\"" <<e.what()<<"\"\n";
return 1;
}
};