CUDAで次のカーネルを書きました。問題:CUDAの idx が行列を正しくインデックスしません。
__global__ void pagerank(Node *ingoing, Node *outgoing, int N) {
int j;
int idx = threadIdx.x + blockIdx.x * blockDim.x;
if ((idx > 0) && (idx < N)){
何が問題なのですか? idxが行列を正しく索引付けしないのはなぜですか?
main関数の最後で outgoing[idx].p_t1 フィールドを出力すると 0 が表示されますが、次のようにした場合は正しい値になります:
/******************** Includes - Defines ****************/
#include "pagerank_serial.h"
#include <stdio.h>
#include <stdlib.h>
#include <time.h>
#include <math.h>
#include <assert.h>
#include <string.h>
#include <sys/time.h>
#include <fcntl.h>
#include <cuda.h>
#include "string.h"
/******************** Defines ****************/
// Number of nodes (set in main from the second command-line argument)
int N;
// Convergence threshold and algorithm's parameter d
// (set in main from the third and fourth command-line arguments)
double threshold, d;
// Table of node's data: one Node per graph node, allocated in main with N entries
Node *Nodes;
/***** Read graph connections from txt file *****/
/*
 * Reads "from<TAB>to" integer pairs from `filename` and appends each `to`
 * index to the connection list of Nodes[from].
 *
 * Reads the globals N (number of nodes) and Nodes (node table); both must be
 * initialised before this is called, with every con_size starting at 0.
 * On a file-open failure an error is printed and the function returns
 * without touching Nodes.
 */
void Read_from_txt_file(char* filename)
{
    FILE *fid;
    int from_idx, to_idx;
    int temp_size;

    fid = fopen(filename, "r");
    if (fid == NULL){
        printf("Error opening data file\n");
        // Reading from a NULL stream is undefined behaviour, so stop here.
        return;
    }

    // Loop on fscanf's return value instead of feof(): fscanf returns EOF (-1,
    // which is "true") at end of file and 0/1 on a malformed record, so only a
    // result of exactly 2 means both indices were parsed.
    while (fscanf(fid,"%d\t%d\n", &from_idx,&to_idx) == 2)
    {
        // Ignore edges whose source node is outside the allocated table.
        if (from_idx < 0 || from_idx >= N)
        {
            fprintf(stderr, "Skipping edge with out-of-range source %d\n", from_idx);
            continue;
        }

        // Grow the connection count first so that slot (temp_size - 1) is the
        // next free entry; without this the first write would hit index -1.
        Nodes[from_idx].con_size++;
        temp_size = Nodes[from_idx].con_size;
        //Nodes[from_idx].To_id =(int*) realloc(Nodes[from_idx].To_id, temp_size * sizeof(int));
        // NOTE(review): the capacity of To_id is not visible from this file;
        // confirm it can hold temp_size entries before relying on this write.
        Nodes[from_idx].To_id[temp_size - 1] = to_idx;
    }
    //printf("End of connections insertion!\n");

    fclose(fid);
}
/***** Read P vector from txt file*****/
/*
 * Reads up to N floating-point values from "P.txt" and stores the k-th value
 * in Nodes[k].p_t1.
 *
 * Reads the globals N and Nodes. On a file-open failure an error is printed
 * and the function returns without touching Nodes.
 */
void Read_P_from_txt_file()
{
    FILE *fid;
    double temp_P;
    int index = 0;

    fid = fopen("P.txt", "r");
    if (fid == NULL){
        printf("Error opening the Probabilities file\n");
        // Reading from a NULL stream is undefined behaviour, so stop here.
        return;
    }

    // P's values are double!
    // The format is a plain "%lf": any literal text in front of the conversion
    // would have to appear in the file for a value to match. The loop stops at
    // the first failed conversion (including EOF) or once N entries are filled,
    // so it never writes past the end of Nodes.
    while (index < N && fscanf(fid,"%lf\n", &temp_P) == 1)
    {
        Nodes[index].p_t1 = temp_P;
        index++;
    }
    //printf("End of P insertion!");

    fclose(fid);
}
/***** Read E vector from txt file*****/
/*
 * Reads up to N floating-point values from "E.txt" and stores the k-th value
 * in Nodes[k].e.
 *
 * Reads the globals N and Nodes. On a file-open failure an error is printed
 * and the function returns without touching Nodes.
 */
void Read_E_from_txt_file()
{
    FILE *fid;
    double temp_E;
    int index = 0;

    fid = fopen("E.txt", "r");
    if (fid == NULL)
    {
        printf("Error opening the E file\n");
        // Reading from a NULL stream is undefined behaviour, so stop here.
        return;
    }

    // E's values are double!
    // Stop at the first failed conversion (fscanf returns EOF or 0) or once N
    // entries are filled, advancing the slot after every stored value.
    while (index < N && fscanf(fid,"%lf\n", &temp_E) == 1)
    {
        Nodes[index].e = temp_E;
        index++;
    }
    //printf("End of E insertion!");

    fclose(fid);
}
/***** Create P and E with equal probability *****/
/*
 * Initialises every node with a uniform distribution: p_t0 = 0 and
 * p_t1 = e = 1/N, then asserts that P and E each sum to 1.
 *
 * Reads the globals N and Nodes. The assertions fail (aborting the program
 * unless NDEBUG is defined) when the sums are not 1, which includes N <= 0.
 */
void Random_P_E()
{
    int i;
    // Sum of P (it must be =1)
    double sum_P_1 = 0;
    // Sum of E (it must be =1)
    double sum_E_1 = 0;
    // Accumulated rounding error allowed when comparing the sums with 1
    const double tolerance = 1e-6;

    // Arrays initialization
    for (i = 0; i < N; i++)
    {
        Nodes[i].p_t0 = 0;
        Nodes[i].p_t1 = 1.0 / N;
        sum_P_1 = sum_P_1 + Nodes[i].p_t1;

        Nodes[i].e = 1.0 / N;
        sum_E_1 = sum_E_1 + Nodes[i].e;
    }

    // Assert sum of probabilities is =1
    // A comparison is required here: "sum = 1" would assign 1 and always pass.
    // Floating-point sums are compared with a tolerance rather than ==.
    //printf("Sum of P = %f\n",sum_P_1);
    assert(fabs(sum_P_1 - 1.0) < tolerance);
    //printf("Sum of E = %f\n",sum_E_1);
    assert(fabs(sum_E_1 - 1.0) < tolerance);
}
/***** Main function *****/
/* Abort with a readable message when a CUDA runtime call fails. */
static void check_cuda(cudaError_t status, const char *what)
{
    if (status != cudaSuccess)
    {
        fprintf(stderr, "CUDA error in %s: %s\n", what, cudaGetErrorString(status));
        exit(EXIT_FAILURE);
    }
}

/*
 * Entry point. Expects four arguments: graph filename, N, threshold and d.
 *
 * Allocates the node table on the host, initialises the probabilities,
 * copies the table to the device, launches the pagerank kernel once over N
 * threads, reports the kernel time in milliseconds, and prints the first
 * (at most 100) resulting p_t1 values.
 *
 * Returns 0 when too few arguments are given, EXIT_FAILURE on invalid N or
 * host allocation failure, and EXIT_SUCCESS otherwise. Any CUDA runtime
 * failure terminates the process through check_cuda().
 */
int main(int argc, char** argv)
{
    int blockSize;   // The launch configurator returned block size
    int minGridSize; // The minimum grid size needed to achieve the maximum occupancy for a full device launch
    int gridSize;    // The actual grid size needed, based on input size
    int i;

    // Check input arguments
    if (argc < 5)
    {
        printf("Error in arguments! Four arguments required: graph filename, N, threshold and d\n");
        return 0;
    }

    // get arguments
    // snprintf truncates instead of overflowing when the path exceeds the buffer.
    char filename[256];
    snprintf(filename, sizeof filename, "%s", argv[1]);
    N = atoi(argv[2]);
    threshold = atof(argv[3]);
    d = atof(argv[4]);

    if (N <= 0)
    {
        fprintf(stderr, "Error in arguments! N must be a positive integer\n");
        return EXIT_FAILURE;
    }

    // Allocate memory for N nodes.
    // calloc zero-fills the table, so every con_size starts at 0 and no
    // uninitialised bytes are later copied to the device.
    Nodes = (Node*) calloc(N, sizeof(Node));
    if (Nodes == NULL)
    {
        fprintf(stderr, "Error allocating memory for %d nodes\n", N);
        return EXIT_FAILURE;
    }

    // NOTE(review): `filename` is parsed but the graph is not loaded in this
    // function; presumably Read_from_txt_file(filename) belongs here - confirm.

    // set random probabilities
    Random_P_E();

    Node *h_ingoing = Nodes;
    Node *h_outgoing = (Node *)calloc(N, sizeof *h_outgoing);
    if (h_outgoing == NULL)
    {
        fprintf(stderr, "Error allocating memory for the output nodes\n");
        free(Nodes);
        return EXIT_FAILURE;
    }

    Node *d_ingoing = NULL;
    Node *d_outgoing = NULL;
    check_cuda(cudaMalloc(&d_ingoing, N * sizeof *d_ingoing), "cudaMalloc(d_ingoing)");
    check_cuda(cudaMalloc(&d_outgoing, N * sizeof *d_outgoing), "cudaMalloc(d_outgoing)");
    check_cuda(cudaMemcpy(d_ingoing, h_ingoing, N * sizeof *h_ingoing, cudaMemcpyHostToDevice),
               "cudaMemcpy(host -> d_ingoing)");
    check_cuda(cudaMemcpy(d_outgoing, h_outgoing, N * sizeof *h_outgoing, cudaMemcpyHostToDevice),
               "cudaMemcpy(host -> d_outgoing)");

    // Events must be created before they can be recorded.
    float elapsed_ms = 0.0f;
    cudaEvent_t begin, end;
    check_cuda(cudaEventCreate(&begin), "cudaEventCreate(begin)");
    check_cuda(cudaEventCreate(&end), "cudaEventCreate(end)");

    // The last argument is a block-size limit (0 = no limit), not the problem size.
    check_cuda(cudaOccupancyMaxPotentialBlockSize(&minGridSize, &blockSize, pagerank, 0, 0),
               "cudaOccupancyMaxPotentialBlockSize");
    // Round up according to array size
    gridSize = (N + blockSize - 1)/blockSize;
    printf("Gridsize, blockzise : %d , %d \n", gridSize, blockSize);

    check_cuda(cudaEventRecord(begin, 0), "cudaEventRecord(begin)");
    // The kernel is declared as pagerank(Node *ingoing, Node *outgoing, int N),
    // so exactly those three arguments are passed.
    pagerank<<<gridSize, blockSize>>>(d_ingoing, d_outgoing, N);
    // Launch-configuration errors are only reported through cudaGetLastError().
    check_cuda(cudaGetLastError(), "pagerank launch");
    check_cuda(cudaEventRecord(end, 0), "cudaEventRecord(end)");
    // Wait for the end event; the elapsed time is not available before it completes.
    check_cuda(cudaEventSynchronize(end), "cudaEventSynchronize(end)");
    check_cuda(cudaEventElapsedTime(&elapsed_ms, begin, end), "cudaEventElapsedTime");

    check_cuda(cudaMemcpy(h_outgoing, d_outgoing, N * sizeof *h_outgoing, cudaMemcpyDeviceToHost),
               "cudaMemcpy(d_outgoing -> host)");
    printf("%f\n", elapsed_ms) ;

    // Print final probabilitities (never more entries than were allocated)
    int shown = (N < 100) ? N : 100;
    for (i = 0; i < shown; i++)
    {
        printf("P_t1[%d] = %f\n",i,h_outgoing[i].p_t1);
    }

    // Release device and host resources.
    check_cuda(cudaEventDestroy(begin), "cudaEventDestroy(begin)");
    check_cuda(cudaEventDestroy(end), "cudaEventDestroy(end)");
    check_cuda(cudaFree(d_ingoing), "cudaFree(d_ingoing)");
    check_cuda(cudaFree(d_outgoing), "cudaFree(d_outgoing)");
    free(h_outgoing);
    free(Nodes);
    Nodes = NULL;

    printf("End of program!\n");
    return (EXIT_SUCCESS);
}
どのようなエラーが出ていますか?私は人間コンパイラではありません… –
グローバルカーネルを呼び出すコードがないと、何が起きているのかを知るのは難しいですが、質問の意図は理解できていると思います。 –
コード全体を載せました。これで説明していただけますか?ありがとうございます。 – Haris